diff --git a/figures/benchmark.jpg b/figures/benchmark.jpg index d1fd67ec1bf748c24b244b6efd825ded1b147787..32d5f6c1718a3c23a8fb0dcd76a3ba0fa097e3fe 100644 Binary files a/figures/benchmark.jpg and b/figures/benchmark.jpg differ diff --git a/model-00004-of-000163.safetensors b/model-00004-of-000163.safetensors index f1cf26f5d9386b3f8234853c58fbc5bf28e60bef..dda9a76e7d51bc68db866d32b6ba9df8fca74f72 100644 --- a/model-00004-of-000163.safetensors +++ b/model-00004-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ad5ca32dcb6c50a954bbeac833f767fcfe398b0d05aea63473907322c1a5bed5 -size 4302349996 +oid sha256:3a9fffda0b2c62ba57e87a9a246113fc3ceb45aa256cf9ff9fdd75dd345a2521 +size 8598786296 diff --git a/model-00005-of-000163.safetensors b/model-00005-of-000163.safetensors index f43f0f79f06c1dc6fe476dc89a662db70fa191ef..9c7bdc7a83d0c2997a922fe762de325b89750049 100644 --- a/model-00005-of-000163.safetensors +++ b/model-00005-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e06768f65df4c19a033253a1994fe7145be9ce28131398ad9f320e3d03e8ab73 -size 4302384154 +oid sha256:59baf5fe1862df4db604533931b07fcb97596712a094851cf85793dc4452c268 +size 8602554048 diff --git a/model-00006-of-000163.safetensors b/model-00006-of-000163.safetensors index c4110d6688e08eae0967b40d38d1e3b923d010ef..580bee5c7888356a962f6f43b6404dc832203f09 100644 --- a/model-00006-of-000163.safetensors +++ b/model-00006-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3eb84d165db019a61e5ca4754d3c6c6aa298b88af5a7617b15b0eca42f64e14f -size 4372073602 +oid sha256:2cfa5d5f02c7ab85d47e07e82cb9353232a842aad2f4747b01489956bf4845df +size 8741916520 diff --git a/model-00007-of-000163.safetensors b/model-00007-of-000163.safetensors index e228832ac4bb2943f78bc576e9b492679429bb86..f2e037a7d7b59fbf9eb4146d9108892a65cbf026 100644 --- a/model-00007-of-000163.safetensors +++ b/model-00007-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d6f299f7b410b9a7806927b5d2d413fae1f2c1dfa340bb0037d02d220cd8c080 -size 4306080097 +oid sha256:4b6f2cdd5392caaa845e140b7f178e4406043771f0d277ad1d92b5cf36a3238b +size 8606225096 diff --git a/model-00008-of-000163.safetensors b/model-00008-of-000163.safetensors index 5671e6efb430436988358b05c8c11e2df21f2303..e23202075aa54e6c6a901ac4b1c518fc5fdb8287 100644 --- a/model-00008-of-000163.safetensors +++ b/model-00008-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:da197fe67d243284d133310255e436759ea1eff8c3f2a684da53496a76d11ce2 -size 4302384356 +oid sha256:fdf1644b293adcf07b9d708f5d385f43575fd2fe962c6d766e48c84f1684d235 +size 8602554144 diff --git a/model-00009-of-000163.safetensors b/model-00009-of-000163.safetensors index d161b640038bf3f20c777fb43725633692894ee9..42f5572a5f437cbcd3d000b544c8d23a7fea2d4c 100644 --- a/model-00009-of-000163.safetensors +++ b/model-00009-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dbd2a790cc3d94aa3d13a0301e23de8bb81e0168e100650dbcac36695533e1d3 -size 4302350190 +oid sha256:b36db93b74136b8852d062c85e764ae4356c3857751c5430d3c33e01bf2fbf91 +size 8598786392 diff --git a/model-00010-of-000163.safetensors b/model-00010-of-000163.safetensors index 61c0a36b9130ebaa6ebb8e77af7ff0fe60a407a8..5abc24a9eff3dc8dc69c192480b79f14fb4477d2 100644 --- a/model-00010-of-000163.safetensors +++ b/model-00010-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:137f0f0407290d8d45d1a3f60c67aa10a2a5434e95d8d07eaf82df6f475d8cf8 -size 4302383960 +oid sha256:ff5bdffc3fca98f7c43b91b12bd0df70661b656050f0fd3ac7f7f1849d580b1a +size 8602553952 diff --git a/model-00011-of-000163.safetensors b/model-00011-of-000163.safetensors index 461591944352ca2c0c3263939451af8e19f17baf..25274f247e6fa94ef5ed8dff617f581a36a471e7 100644 --- a/model-00011-of-000163.safetensors +++ b/model-00011-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:47b308ea2f7f7a4a812a28c0a5c75d5f648a08b0c118bd0863fd2f7320e6bc76 -size 4302384375 +oid sha256:10faa73df07efcc7961c547b5cb93cf17d612d32ef52e9830b4260d0ce63d95a +size 8602554152 diff --git a/model-00012-of-000163.safetensors b/model-00012-of-000163.safetensors index 9fdbd8e623da43069be4cfcc0420d67b63ac52df..071aab62b8ff764eb51a3bf133fa992f1b2b9ef8 100644 --- a/model-00012-of-000163.safetensors +++ b/model-00012-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4cda99d04536d50e067c3a2c8c9ead34d307b2002500b1a8b8c7ad4ac85a9061 -size 1321583941 +oid sha256:e204197e2af834ebfd4af43526914503fadfa58796b4705579314f4e9887324d +size 2642451624 diff --git a/model-00013-of-000163.safetensors b/model-00013-of-000163.safetensors index dd20e3f278e8ee984012f557073e6363582e4560..9d7b6572477f3d35f0b490c34d48e409f3993821 100644 --- a/model-00013-of-000163.safetensors +++ b/model-00013-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:33adbb52d544cac90603081e871ff3260ee993c479fd96194716da54cfc57040 -size 4302317244 +oid sha256:d039dcb1f0f65987e36d045006f139b8d6c99fe8a9373a70c70991213cfa9f43 +size 8598757320 diff --git a/model-00014-of-000163.safetensors b/model-00014-of-000163.safetensors index d3ad29b9118525e07dcbbaa0381238dd7b0c238a..a538006474d018b579e143b2dbb9c68667a6d736 100644 --- a/model-00014-of-000163.safetensors +++ b/model-00014-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:05b19f1bd14644e5e6db24575322d3e74a611f26b71a8021345caf0d9b416fd9 -size 4302384328 +oid sha256:97d7725d9ef598faba4f1284cab74b1ae32cdfd02b828079b904a52eba0d7b8e +size 8602554136 diff --git a/model-00015-of-000163.safetensors b/model-00015-of-000163.safetensors index 0a2e60a20434d81f672e64b9a6ff6e92122ef16b..85d1512cba65b0ffd4e269d950c84be260c7fd16 100644 --- a/model-00015-of-000163.safetensors +++ b/model-00015-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0484ca365f84ed446f992e3e43eeb4e182a05c8d554be385f1e1535d4d80f4fe -size 4302350218 +oid sha256:a46d3ea85ba43a66193d0f7546ec1c936a4b211fad91188ab8f43093b60f4d37 +size 8598786408 diff --git a/model-00016-of-000163.safetensors b/model-00016-of-000163.safetensors index cea2a7c549de6bf7e55d17b331ee028d8c6d71aa..1fe5502de8b035b46ed089b714e4bc8539a21ace 100644 --- a/model-00016-of-000163.safetensors +++ b/model-00016-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1a70800c3373608f3b3f8dd4643c9574360896e3dd647acb39f4e794284e6ee6 -size 4302383932 +oid sha256:b6630ebc4caf694bb3918918a0a06dd00f3228c764f0725bebacc7d7c02c935e +size 8602553936 diff --git a/model-00017-of-000163.safetensors b/model-00017-of-000163.safetensors index f29605becbd55050b9f5ec1256218fb326bbbb01..8469c5cc489ee8ab4323d167115d5f1677f878f1 100644 --- a/model-00017-of-000163.safetensors +++ b/model-00017-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bd5abae258a54b0b4ded4f85c272b34a05f968b32dfc46412af8f5775b95ece9 -size 4302384377 +oid sha256:becb73788e18f5b3ab21e4aaa0ed846791b9b062c247fed8daf48da3006e463c +size 8602554152 diff --git a/model-00018-of-000163.safetensors b/model-00018-of-000163.safetensors index a189957b40d5e5e7c7fc7be88c68ef9470da1cea..f7bc4b2d46db79f58171d5a6ad982e2232d2366a 100644 --- a/model-00018-of-000163.safetensors +++ b/model-00018-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b5418a2987ad8d4a188592c014fbb107f7605266375c5b29d42b50d449a0a9b0 -size 4302350026 +oid sha256:3b9d024b0e6b87889bdae11855048dd7dc26df21bc1b354962b270cfb7ea551c +size 8598786312 diff --git a/model-00019-of-000163.safetensors b/model-00019-of-000163.safetensors index 5fb550a44397287a71b8a2f3b90dee73444b3222..b13e60bf2ac9811e46e42732c52eb35ef71711a7 100644 --- a/model-00019-of-000163.safetensors +++ b/model-00019-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:69bbd687eafeb7e7d7ff111af3233a10e7c74c459b6d3b466a7d93f6878d4915 -size 4302384124 +oid sha256:a49fb1889fd754eb3db9b25dbea6ebb5f152b1f98b9374157306c258b997e540 +size 8602554032 diff --git a/model-00020-of-000163.safetensors b/model-00020-of-000163.safetensors index 00ca3f8d5ac1edd6613c6117ef5cce3785d495e1..8e6d79147029ae5744884ea8788f5df099dfa554 100644 --- a/model-00020-of-000163.safetensors +++ b/model-00020-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2560e878221496c2326c0538d7898e28b30cec87c70c599b321c4292bac91fe1 -size 4302384377 +oid sha256:e039712e7b55545d7a5e26d99c2c37f23d354b09c773251da9d95d2f91f79ae2 +size 8602554160 diff --git a/model-00021-of-000163.safetensors b/model-00021-of-000163.safetensors index 87d7c4d75a2c621f9b31fad331b634ad4085be1a..7eaa34f5188487a6452cd6bfa5b53ad8aa388dea 100644 --- a/model-00021-of-000163.safetensors +++ b/model-00021-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:09e6825f850ba74ac9293d8179b3e7ebe3a69a3193fb0a129bf5dcaebf0b6201 -size 4302350413 +oid sha256:6759dceaf8e72b62eca652da8cc923102f5d00d6b2a4b17c8b2b7d582fcab5a5 +size 8598786512 diff --git a/model-00022-of-000163.safetensors b/model-00022-of-000163.safetensors index ecafc13392ff21983580d519da6a09e2df05c7a7..61b730e77c8b2f653bd72314ca5c8fbad265d98c 100644 --- a/model-00022-of-000163.safetensors +++ b/model-00022-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:083a0025a915e3eb8077b24abf6d26cbbf60709f308e6eaec4a3121ab368788f -size 4302384900 +oid sha256:3f73806d4cb4f80e744b6dd6a79bd97d4c9466e48a7191066cb154f19a650fee +size 8602554416 diff --git a/model-00023-of-000163.safetensors b/model-00023-of-000163.safetensors index 332bad40e536e7b24d02d787ce66182d148f34e0..05579c1a3b6676bdeed07fa139ac9d3801ee2ccd 100644 --- a/model-00023-of-000163.safetensors +++ b/model-00023-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a10ddf9357a7603dc603fa1bbc4e0e947637f33cb6f2bfc0725a721f93622342 -size 4302350808 +oid sha256:b41bc4167b28a28ebf96c29ab7d744f46398030c0de383a091c27d2b378fabb7 +size 8598786704 diff --git a/model-00024-of-000163.safetensors b/model-00024-of-000163.safetensors index a43cd5b37a4f5ddb6b1caf3df1c55a2d53f67fba..8f42da3d72181ef2125e5c80a3c6eca86e683cad 100644 --- a/model-00024-of-000163.safetensors +++ b/model-00024-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f13210eca8ecf63123dce2ebcc9de5833b6d31b47f85970b6e6f7f00997ef78 -size 4302384504 +oid sha256:8a1e67fa44a09a698e070f0f81f637c1bca664ed40e45f24c9a307c076ae64fc +size 8602554224 diff --git a/model-00025-of-000163.safetensors b/model-00025-of-000163.safetensors index 42dc014a993e017ecc0bddf90b9a0ade6cc336ce..1f4a127f9ae653753fea001bba50f4afdc8ceaeb 100644 --- a/model-00025-of-000163.safetensors +++ b/model-00025-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d511a1879fd6cdba6823f29af05242e3f46374eec1d957a5b4db01c5d83ebc8c -size 4302384961 +oid sha256:40f972cced4deee0e61071ed94ce998d099083cf4be8b431efb06ab5d105e313 +size 8602554448 diff --git a/model-00026-of-000163.safetensors b/model-00026-of-000163.safetensors index 3a3917b0f25ab2eb9e5a00667f203eb572b57450..b43bf34a274f70402e9431b5b7b74722ef251246 100644 --- a/model-00026-of-000163.safetensors +++ b/model-00026-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0c50460d2ee189e76fc3eb111ef0ecd4d28dd05b5bca619bdd122827fca31e10 -size 4302350620 +oid sha256:4c7bf2562f107c268579a8cdae8e87e165b0c780fd7166094d4d5632b5b04b10 +size 8598786616 diff --git a/model-00027-of-000163.safetensors b/model-00027-of-000163.safetensors index 32d76986fa61570df617850ad1d43ddf94f350fb..b173190acd0abc7be2c9377d228937c47a983a7d 100644 --- a/model-00027-of-000163.safetensors +++ b/model-00027-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:260ad43d8099317e55c97d7931941419d04a45f2169967328dd721104f9ed63d -size 4302384692 +oid sha256:c72f7f985dc12fa4e9105c55eecb9be6139b78ed17713e70013af7f375d9c929 +size 8602554312 diff --git a/model-00028-of-000163.safetensors b/model-00028-of-000163.safetensors index f1301d3d37d68e1c03a4aec067143c5d18a15ea3..1e203d0e7d4b48d4b665aaef5e7eba415f0151bb 100644 --- a/model-00028-of-000163.safetensors +++ b/model-00028-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1acbd0856de26f397bef297165e6a12d2fd419fdda8237891b0da5c43c27a2a9 -size 4302384963 +oid sha256:ea9febe137ad6c326eea88e093218e28fb22fea439319025eb89e5032af7f851 +size 8602554448 diff --git a/model-00029-of-000163.safetensors b/model-00029-of-000163.safetensors index 3cb66baeb7d3bc557830e9a38d1006a0092e8503..21564b6062a526deac44314bc176d3ad18368e61 100644 --- a/model-00029-of-000163.safetensors +++ b/model-00029-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:20d3ef472a46a6c7d340476b6ac105c7502ce71d1903022502cc5069c1971792 -size 4302350448 +oid sha256:51e0500521bba5dbd8faf94bc68af7b3b6197b67498cc5f078e4e2199b14a890 +size 8598786520 diff --git a/model-00030-of-000163.safetensors b/model-00030-of-000163.safetensors index 5816afae4d9c56eac723b16cb7fe4554729b6d83..0734f2a853a54739403af5aa17f9baa8bfd236bb 100644 --- a/model-00030-of-000163.safetensors +++ b/model-00030-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ac1d12d32f3a95e111cfd09f0255ed6af2b9237187aef1dcf78230c1f637abdd -size 4302384884 +oid sha256:fc3a398e0e0dd6995c4731f7333830ae359882a994e1790d2045e1ff4e7681ed +size 8602554408 diff --git a/model-00031-of-000163.safetensors b/model-00031-of-000163.safetensors index 963bf57a208411dd4512ac2823c93c01c57ee622..d62effe197f2a2f31e938aa0456b2fe38ab43ef1 100644 --- a/model-00031-of-000163.safetensors +++ b/model-00031-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eace4ef31c4ff04f22501b93eb476fd8e0289c749d0dd30c9c510ec520b98055 -size 4302350824 +oid sha256:3d81fe26a786ed8d4238b0ffd976ead048075cfd4ee5222c02b34e5727d3b373 +size 8598786720 diff --git a/model-00032-of-000163.safetensors b/model-00032-of-000163.safetensors index 30c904d3366a50afd2676c33b09ac5be5359ad82..076500e86f61190d80907a4caa6d57469e8c8ef4 100644 --- a/model-00032-of-000163.safetensors +++ b/model-00032-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ac7f5250660b596b6e3c430c9f0d3139b0e6b7aa1fc08069dc0e3966f08c92bf -size 4302384488 +oid sha256:e8e98fbd5a8c8ec709c86608faca725309041203a71b1ea3ee20ccac1575013a +size 8602554208 diff --git a/model-00033-of-000163.safetensors b/model-00033-of-000163.safetensors index cf2d6c87f60a05333b1f84a665e0afa72e896520..32db6941a1f79dddf0eca38efcab694cc5af8d15 100644 --- a/model-00033-of-000163.safetensors +++ b/model-00033-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f71549c7a33eaacdff8a2406a82957562404548a7fe5f2130a3573b36dbddef0 -size 4302384963 +oid sha256:16043317a49e745e5743194920d6d5cf73472d5e7581b5197407465903525196 +size 8602554448 diff --git a/model-00034-of-000163.safetensors b/model-00034-of-000163.safetensors index 877026bf7ddc5ee84e5873e33bc284fb5cfaa41f..d5c834a9e1b6ba151e599342dd70db4cf3375bb1 100644 --- a/model-00034-of-000163.safetensors +++ b/model-00034-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dc52ac9cd64be1135b3ed03df71d9c63af56b62738156b95af65b3400abe781f -size 1747417474 +oid sha256:8bdf4e8779f20854d43608277dec089d72b547c5636c5cf6e1b1cc8a3488e18d +size 3493899088 diff --git a/model-00035-of-000163.safetensors b/model-00035-of-000163.safetensors index 16106729d3b99b1ee0e8a4add6f723721e96b925..72cbbdfa3b9252e1397f9148aee88766ce97aa51 100644 --- a/model-00035-of-000163.safetensors +++ b/model-00035-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f4677233a2a36db63ea5fb010dc3a5ef882285f3ceb2c428ba4c1cdae9ed585 -size 4302317817 +oid sha256:0dc868c6f6dee0fa07b69700ff7c2669d32bbe44b4c3e809d202930f5851bbef +size 8598757608 diff --git a/model-00036-of-000163.safetensors b/model-00036-of-000163.safetensors index a04c52a614fa2fbf577a44ca5d89e0367b5ff6b0..5e9e45e453200240048196f12a95b19c8d49434c 100644 --- a/model-00036-of-000163.safetensors +++ b/model-00036-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f0b62c567e3c9e0bcf51bcd994d0ed67d5df44c2cadcf407522e445be8ecf6b2 -size 4302384914 +oid sha256:663c4175d3c9dcda7e3233e497a2b8eba354f9b5ba08f41201109e5cb111fa11 +size 8602554424 diff --git a/model-00037-of-000163.safetensors b/model-00037-of-000163.safetensors index 0065b22d1bec8188c3edaef579f7c46a99e453c6..abb0584fe3ece056b6360d797bef17d9e4bdcd83 100644 --- a/model-00037-of-000163.safetensors +++ b/model-00037-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9d7c8a1c35d1df030c95186eb6acaceebabbef95374de6c8a385c4b87e1895d2 -size 4302350794 +oid sha256:7116de8fdf43da16827efb71433a60424358a36573d060626a6e647d571326e2 +size 8598786704 diff --git a/model-00038-of-000163.safetensors b/model-00038-of-000163.safetensors index cf8194ed5e74aea33e4a9133a728fa2f86d335cb..be8838dca7fb052e5fe0a8be64969df99f36ff69 100644 --- a/model-00038-of-000163.safetensors +++ b/model-00038-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ea241680b9422782815a20eb1d7a99e37a65260b08a17557e946b9c20219649d -size 4302384518 +oid sha256:21723ffa0998ec533df4021b821518668f298f644d1a26b300cd8552128d6b99 +size 8602554224 diff --git a/model-00039-of-000163.safetensors b/model-00039-of-000163.safetensors index 0b054983d63c72fcf36975a866fa7d31dbcb7504..35433ae17f0fc3aca94161ec18d4de9868447f08 100644 --- a/model-00039-of-000163.safetensors +++ b/model-00039-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6dfd35cf8163ebcdd73ee4cc6beacf011b1d00f82b842fc3d914f7230e52800b -size 4302384963 +oid sha256:a16ede8ff7d1e2fb96a9ade240f30aebdf9aec0c033eeab66869be3ffde9be4e +size 8602554448 diff --git a/model-00040-of-000163.safetensors b/model-00040-of-000163.safetensors index cf198ad60893f0d49d96fbae43a075a215ad8ca4..8808ceff8d282c3071fd504fb7668c53b461d2e8 100644 --- a/model-00040-of-000163.safetensors +++ b/model-00040-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fc4c69c0e91ece15f1a1bc0bf17e1d36c514bbb138c1412a0ced41118d75a052 -size 4302350602 +oid sha256:51f26d9fb09724bd77af78f97e0f8180e323e163a1186424dc74f8877aa12ed8 +size 8598786608 diff --git a/model-00041-of-000163.safetensors b/model-00041-of-000163.safetensors index 2c81bb9c4d9910442e57609c9d10bfcb12ff8fd8..9d1304cd6817115a75abb696ad139adc9842107f 100644 --- a/model-00041-of-000163.safetensors +++ b/model-00041-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:333c52631a3de667f9c4a01dd644a9520832ca4a933be7c6ddfdfe6525573c3e -size 4302384710 +oid sha256:e77668a49e7785b1d8a5e2ceb4875c87cfe9ecac51e1ee420bc41ef8fb167a97 +size 8602554320 diff --git a/model-00042-of-000163.safetensors b/model-00042-of-000163.safetensors index 8578ecbb4ba55968e052af2c3d06f75d8aad3402..44bc2e278f36bfd20eac7e0bb201836af4f4c1c6 100644 --- a/model-00042-of-000163.safetensors +++ b/model-00042-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:450f75fd01ff57776f0679d9b3c819be08d7057e265d43dda2c65d4851efd89d -size 4302384963 +oid sha256:a3a0f94bdb238df8e9504fb349634fb76be37f60952ee3f64b6c529445a45766 +size 8602554448 diff --git a/model-00043-of-000163.safetensors b/model-00043-of-000163.safetensors index 3e8656244e49db124b5f863c515a4726411ee29b..ba83c5dfc47b86e96833e8a4c6ae4f2cdc797968 100644 --- a/model-00043-of-000163.safetensors +++ b/model-00043-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:aab6deabc7117de24a14a81aae0c5ff6e10be064913cc48b21d9a89fa511b45c -size 4302350432 +oid sha256:e495f6da3338565b81305ca1e2ed925f6de504c4928cd17ae7eb03ea0b8be695 +size 8598786504 diff --git a/model-00044-of-000163.safetensors b/model-00044-of-000163.safetensors index af903f1f8943744291327c16facc2d0f2a2c5a93..bcae9244a0d5d5eb55d1ee88aedf7e902958d298 100644 --- a/model-00044-of-000163.safetensors +++ b/model-00044-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c9d6582f530adcf2c8b864bd9344652fd0bb939360e7c30f6e47bc09986cc576 -size 4302384900 +oid sha256:6e7947a7ac8b51f9c73731f5de9b2398238cee5ef8a9bfded3797473b498f3d0 +size 8602554416 diff --git a/model-00045-of-000163.safetensors b/model-00045-of-000163.safetensors index 7a3fb9642264f69b7edbebebea31269f53d50274..e222d8943b66e2db1c7bfa845cd882039230d826 100644 --- a/model-00045-of-000163.safetensors +++ b/model-00045-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:938c7306ce56ae407005426e38a246a6ee5ebb9f941230da38d99493ea954831 -size 4302350808 +oid sha256:867c286983f1633248ad628074d591d1a75191c45786cc0610db447a5a48cdb7 +size 8598786704 diff --git a/model-00046-of-000163.safetensors b/model-00046-of-000163.safetensors index 8d5ad1a146e477a5017337c74ece1950305371d0..4000d42e6d79bffb7d5129753bf6f6e195face22 100644 --- a/model-00046-of-000163.safetensors +++ b/model-00046-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e13e11c8bacd5557df1e6f864e7e260283b6a9672f85afd1d97841b63db899b0 -size 4302384504 +oid sha256:9d1446557a2e5f6c93361788626ce0daf918c41c771125b75a08ea5a1953daca +size 8602554224 diff --git a/model-00047-of-000163.safetensors b/model-00047-of-000163.safetensors index 2db23955cb140841b113770699012aeb41792005..77565ab4fee4685421823313d717c4693727495e 100644 --- a/model-00047-of-000163.safetensors +++ b/model-00047-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3ae5dc07da78e72f3b8064b53d042081a64755e4dfd792ac13f1615d6f70a86a -size 4302384961 +oid sha256:bca76a65e27b91cc7f5eda783b6c8c9f064a5d260bf2747ef025d7df08e4f873 +size 8602554448 diff --git a/model-00048-of-000163.safetensors b/model-00048-of-000163.safetensors index e18609f7d2b98d72187c6e0fc220f821fec80d21..c82826e13bae1bb3a03c2b1f293df3573a900ea7 100644 --- a/model-00048-of-000163.safetensors +++ b/model-00048-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:df85e837c8960a00205f57b27edb17278c18beda17ce1ed3acf482ed85076c6d -size 4302350620 +oid sha256:6a484c57aa9273db48ebf95f2d13ca8548188c1c8380abdd1811fe6a3d893177 +size 8598786616 diff --git a/model-00049-of-000163.safetensors b/model-00049-of-000163.safetensors index 6f12fbf7629854ee615fd4beee57819486f0c1ee..1330f673bd42db69fee8f3524afb146862f33102 100644 --- a/model-00049-of-000163.safetensors +++ b/model-00049-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:207e8af06dfc8b9b2a34554fa4ecc0ef0c6b87d12db7c9dc62eb15ee29f7491b -size 4302384692 +oid sha256:58532be8d29009451a3bb3e1bc5e29236c6e80f9650595a5dea6b12784ee0dd0 +size 8602554312 diff --git a/model-00050-of-000163.safetensors b/model-00050-of-000163.safetensors index 94d32a8a839163f57bfe94ab52885c6eaeeed1b8..855d80e67b2a1799462a19d1a7f4b22db5291bf8 100644 --- a/model-00050-of-000163.safetensors +++ b/model-00050-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7dfd5bcb9a53a0e9d3cdc2b897021c9abc75dfea2d3a8661ba8c38c0283ca7c7 -size 4302384963 +oid sha256:59b4009aedde11ca72dbf8763aa48523ee67bce482688c4650987bbda8a781af +size 8602554448 diff --git a/model-00051-of-000163.safetensors b/model-00051-of-000163.safetensors index 5a6811974a5ff72674b964e71d0e718bff92c22c..56c65b92a5f6f2528917111b7c2f7c79fa19cdb5 100644 --- a/model-00051-of-000163.safetensors +++ b/model-00051-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fe8ba090ec48bff17fe6aec44474d9d3aaa3d1900cc5b878c882bf15f32bd97c -size 4302350448 +oid sha256:484b03be0ebf2fc12fb97ae4382357b57ec43e80a17622c96f0c66abc2ec0ccc +size 8598786520 diff --git a/model-00052-of-000163.safetensors b/model-00052-of-000163.safetensors index 5726748b6b4d4869ae2904c64ac15c96220ffeae..30dc65c25fc4e80805d65262a579e4ef42edf194 100644 --- a/model-00052-of-000163.safetensors +++ b/model-00052-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:03945249e7af5cf507e7941917f45a8dadcb3867c2ae9ab8f40197ca0b27335a -size 4302384884 +oid sha256:3fb5da4bf9365c4df89af0a867768ef16f6b1f1ba46594f04037085b911e7e5d +size 8602554408 diff --git a/model-00053-of-000163.safetensors b/model-00053-of-000163.safetensors index f638fc241a8adbb86008b77d8616b5306eca6029..e1c69641d915b1646007e1f46512e248b99b09c7 100644 --- a/model-00053-of-000163.safetensors +++ b/model-00053-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1a764331dbf293390b1987f435a092148946cf95e7e4f784f3911d6130db71d0 -size 4302350824 +oid sha256:b60d4386d43ff3ea7852c85f9926da89950eeec8dbe28ad511063ca276739ea9 +size 8598786720 diff --git a/model-00054-of-000163.safetensors b/model-00054-of-000163.safetensors index d15382a8262f7d1ab4db6d158e98f455f58e39b2..50e751d65a3b0fb283dc58d8205a31ff91ea9b19 100644 --- a/model-00054-of-000163.safetensors +++ b/model-00054-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a13688518c528eb3f5728d32105b8e5fb8e3d6f513076309b27734faa150a908 -size 4302384488 +oid sha256:41d8805f5b2a0b45de2a7f1ce41a4d68d0a157fd811e4d8f09f4f73c810ea7b9 +size 8602554208 diff --git a/model-00055-of-000163.safetensors b/model-00055-of-000163.safetensors index 9e7bc0bb0e37af0b88b7e3082507f506f61ede8b..fd948a82428b901051de8fac9b50e05b4a840014 100644 --- a/model-00055-of-000163.safetensors +++ b/model-00055-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bb473f1ccda3b70c43e1cba1a55f54ce23d1e22ab855e03cbfa757021ec1f802 -size 4302384963 +oid sha256:fbe0e400217d2d80ca980433d6684230ca795fec3425fe0edc982f694af7a5e0 +size 8602554448 diff --git a/model-00056-of-000163.safetensors b/model-00056-of-000163.safetensors index 7f2fb88ab4f786c4cd189f48c6ae0b67471a5c85..8a286b7b0b8a27ca814264c7caf2cdb13087dd3c 100644 --- a/model-00056-of-000163.safetensors +++ b/model-00056-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:210545cb12fbfaa3f42ddc1ecddaf04ea209bcd539aa60626a8f2437aa267f2c -size 1747417474 +oid sha256:4fdd86f08f8ffafb7236c38e04775088378bea518af4d063ac07a3f43924c1ce +size 3493899088 diff --git a/model-00057-of-000163.safetensors b/model-00057-of-000163.safetensors index 0f571961fed1de0eb5bf86518b064cc4f9c0ac41..9c5c5f156ec2810a4e395894e6e24700e93be29c 100644 --- a/model-00057-of-000163.safetensors +++ b/model-00057-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3b35f6380a2582fe31ab19767525f63b00797e8d5c1171e31fcd8b9a5fca4748 -size 4302317817 +oid sha256:9fd1d954444702f042c6949b77d4e198ba2c8c415db5baf76cff9fcbd55895d4 +size 8598757608 diff --git a/model-00058-of-000163.safetensors b/model-00058-of-000163.safetensors index 8272980fb703b387338065fee4bc7cb850d7f68f..c9466faa4a34bc3b3f200a12d43c141b206422cd 100644 --- a/model-00058-of-000163.safetensors +++ b/model-00058-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:28d7ed16f5201e9c55c5ab8937d7303eef22a46e397a135947ef84d6e2d791aa -size 4302384914 +oid sha256:642cd14a735600af3d00c9b9187e9aaf2ad6b9174681193ddf270fe89ee2bfaa +size 8602554424 diff --git a/model-00059-of-000163.safetensors b/model-00059-of-000163.safetensors index bfebda022ab146c2b4a1fbfca71685b9c189cb36..451ec54f5401deed32caba79c3d144112b4ed96d 100644 --- a/model-00059-of-000163.safetensors +++ b/model-00059-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6edacb001b24def3874d7f03d97f18da56ef4b7937d81b65d6a15f3729098835 -size 4302350794 +oid sha256:0a8543b0ccc8cb73df1044e80b78d74beba2c233e2cca05989f0fd7e7e0fa42b +size 8598786704 diff --git a/model-00060-of-000163.safetensors b/model-00060-of-000163.safetensors index 176655b20c1767f7b70d23c9ec9950dcdfdf2be2..a693654a194020471d5b2ac1678f3ad967ed6b8c 100644 --- a/model-00060-of-000163.safetensors +++ b/model-00060-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fef1246c153b46c6382c1a7063fdf17c458d4e68d1abdac87b4fa3be0e0c046b -size 4302384518 +oid sha256:d4861e18bedec884d6191ae27386f4b3f2a0b52f6be57df991b1b9d0ad751fa9 +size 8602554224 diff --git a/model-00061-of-000163.safetensors b/model-00061-of-000163.safetensors index 59200c8811852ffc33aa2fed92ef2eb082ab382c..ac6d444de6babf327941f8cd92d03f128e20983c 100644 --- a/model-00061-of-000163.safetensors +++ b/model-00061-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f88ba0e9b666fb22e1ef50ec25ed382e35a943ffabe28f493eb81c00880f8541 -size 4302384963 +oid sha256:ddbd126b630a8cc954077706d1469ea2df8a5c11677ce336e3d30808b312431c +size 8602554448 diff --git a/model-00062-of-000163.safetensors b/model-00062-of-000163.safetensors index 6b1f034c62aa0cd8f1848ef0298b1ea807d72bc1..2c8f856ac3f8fac060780d4f40296dec10fef4a3 100644 --- a/model-00062-of-000163.safetensors +++ b/model-00062-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:009804d0502a2a2eb46e67cd852b8ab2f749503c2d54d851e12a8e45ad188a0e -size 4302350602 +oid sha256:8505a633d675e26469862fb4b490725c3b484350194368078480e79823b7e383 +size 8598786608 diff --git a/model-00063-of-000163.safetensors b/model-00063-of-000163.safetensors index 60ddb057d8dd967f324060981e540bbf46875afd..768102c6ef1122d42e556923c0ceaf967c6f6882 100644 --- a/model-00063-of-000163.safetensors +++ b/model-00063-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9f762a03e4831cc65ba310336cb5101f2506e675bc13f05758e7fa453c1c50ba -size 4302384710 +oid sha256:c5dd301776f19c530c46d38b28746fd6b46ebdedb44094f9ba467db5add10387 +size 8602554320 diff --git a/model-00064-of-000163.safetensors b/model-00064-of-000163.safetensors index de7d1ddf17892cb829075a1e685a630913e340f5..b5c0ca1aa8a994a58a96295da322489fbba33e9d 100644 --- a/model-00064-of-000163.safetensors +++ b/model-00064-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cdbe9c409a1a6f6c2cc58a3598ef9fa2f182726c1597f2672272ce487ae26bb7 -size 4302384963 +oid sha256:31fa21080179721762ce4c568da7d7c49ea7aa76dc598ec7b1033da6011087fd +size 8602554448 diff --git a/model-00065-of-000163.safetensors b/model-00065-of-000163.safetensors index 40e8fc23ba4937c5bfe526566b1c464ab437dea4..b67a43c44a56204ca1a1027912daa8533ac65e7f 100644 --- a/model-00065-of-000163.safetensors +++ b/model-00065-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9849c2c30fa0dcc44efa55a45afe9ec65c683bb4c370bbca9d96eb9ae30e6126 -size 4302350432 +oid sha256:7ba6c10d38d6b3781d49b5396ae907b854fcec20b7b1966c0091eccff9702d73 +size 8598786504 diff --git a/model-00066-of-000163.safetensors b/model-00066-of-000163.safetensors index b13242e2a02d11d00a3ebb120168fdf0a4106267..081efc8d423b22b3e71f6423139a7f20a515e588 100644 --- a/model-00066-of-000163.safetensors +++ b/model-00066-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:88a3879e8d8928b7b2304246c5f31ecf7ab47ca11ec750b9adb66670f02f9067 -size 4302384900 +oid sha256:83e856db43bfb8aab0c9fa752c2ba89c95d3c4daf90fbfed872da2e8e164f26f +size 8602554416 diff --git a/model-00067-of-000163.safetensors b/model-00067-of-000163.safetensors index 5e091715a438b3bba6d9103f760ebf317b64f7b0..0d8fc1db3121401fc8e5c77dafa016d2499faa93 100644 --- a/model-00067-of-000163.safetensors +++ b/model-00067-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7d4c58f31a14cc0422b6fc983dfe776920a6dd7d5e43ff547b3ed98292274a9a -size 4302350808 +oid sha256:e5c723b79180ef12f2e1a82b1600d2e415dd966c9c4166ff07b46ebc1dee00fa +size 8598786704 diff --git a/model-00068-of-000163.safetensors b/model-00068-of-000163.safetensors index e47d81e93bc68046e4ff7f26fd8d9530bdbe0a98..73f1ec02dd192e0236490c6e644baf7a016c5a95 100644 --- a/model-00068-of-000163.safetensors +++ b/model-00068-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:910927c6e17d27e8622d8da37db6584c9942e9c2b9f20419305355591a2d3c7c -size 4302384504 +oid sha256:80b8e57578494d37fc163bed4a5b3b8ad03ba218a9d5f8af78610b1f8580ee47 +size 8602554224 diff --git a/model-00069-of-000163.safetensors b/model-00069-of-000163.safetensors index 995237b5c0a3e8265ecb40aca18249e7e4629ba1..ffd247c61e8cc9d05db42113be39f551e43ff251 100644 --- a/model-00069-of-000163.safetensors +++ b/model-00069-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bcfacce03108604b61fd2ae2fe4f6e445a04e0bd3334b6370b309badd2c8af76 -size 4302384961 +oid sha256:1eac93e819183abf53a2bca5b5e4a39ccd7368343f28d5103b7c98cd2832574d +size 8602554448 diff --git a/model-00070-of-000163.safetensors b/model-00070-of-000163.safetensors index 7c2c071163bad51317d5796cb9020e15bcee2446..430042a556d54e835896bd3067494d66aba5c329 100644 --- a/model-00070-of-000163.safetensors +++ b/model-00070-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:276a349ba4ce41d93421c016cea0d5efa6f162047c290737ffc2b184f382c952 -size 4302350620 +oid sha256:ce2107a2c3b62cf21cacc86b7997ad54f4f2b2764015fbf0649039c084a97454 +size 8598786616 diff --git a/model-00071-of-000163.safetensors b/model-00071-of-000163.safetensors index d8dd335084abaca82edccee59fa873704991d8a0..1d70d47e548313c445d21bf8dcb3eee2f6417d1a 100644 --- a/model-00071-of-000163.safetensors +++ b/model-00071-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c550537013ea699170cf938e5d579c2cc43c1d3abf4333978a1118b431c9d589 -size 4302384692 +oid sha256:b141897abcb5642b33b694f889c153faea38defcbb87a672ef30dc1dc684730c +size 8602554312 diff --git a/model-00072-of-000163.safetensors b/model-00072-of-000163.safetensors index ad199788b2d60a0df5604d4e470931dc13b63d22..3bf11d23e7f03b7baa95ce6ccc4c0cfc335e28af 100644 --- a/model-00072-of-000163.safetensors +++ b/model-00072-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:39f8920d14e948da0fff2c7ff38e56a7f2e9e546b335b28e94578512314e3700 -size 4302384963 +oid sha256:5d4d9ef4afb7873dfa001f71f6b44ffd2103bcf627a012d792185821be16c85e +size 8602554448 diff --git a/model-00073-of-000163.safetensors b/model-00073-of-000163.safetensors index 1b08ca4ef230c249b09e62fa0c36e29f832e7042..e424a65470a13f777b5eafca82ac32a4269ba868 100644 --- a/model-00073-of-000163.safetensors +++ b/model-00073-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:960e55ecc0624c4cca92659ef01270c5713092df9f8eb6b1240f81f4584dfad5 -size 4302350448 +oid sha256:bf89244d0c55300a2767306b424eff449e2a515b505b917f9599006a8cd83dbb +size 8598786520 diff --git a/model-00074-of-000163.safetensors b/model-00074-of-000163.safetensors index ffd0da93375105128741d6a087df744691326b5b..4ca7f0aa10cb05e1e526793b8f049503ca857988 100644 --- a/model-00074-of-000163.safetensors +++ b/model-00074-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3fcd1a5bf85dd5f4e7aec823e69ae65c0c586b9d70229b3e893b3dfae1d087bb -size 4302384884 +oid sha256:6c560e37ac4f6be3c9824741a94cd63bb65b2f00655e9467734fdd3b99bc5e35 +size 8602554408 diff --git a/model-00075-of-000163.safetensors b/model-00075-of-000163.safetensors index 54dfed52fdf9da1b59b517b922c46d850d2ae964..8a35714a51ee1f821f74976c446f68e81406418f 100644 --- a/model-00075-of-000163.safetensors +++ b/model-00075-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:66e03af200bf1902dd72a44b8b806ace9c03cf76b03f7fd34b227e5d1ad06273 -size 4302350824 +oid sha256:692fff8d4f97a5ebe7bcb2dd5b4f7375fc4595b041b1480c15defa73fd95d8fa +size 8598786720 diff --git a/model-00076-of-000163.safetensors b/model-00076-of-000163.safetensors index 68c43654e815d033785daf385dd07f74fcc5fa0d..4b8c4bb40300548ff046431632423ec1c8a6ff56 100644 --- a/model-00076-of-000163.safetensors +++ b/model-00076-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:43cfb5095eb8d00d043186d192efa09dc79cd4e7b8017deb00c7a4c00de9d82b -size 4302384488 +oid sha256:033523de996f2982a34ab48c66d8cc2e49bfbec8fa7eabb1f71b3366d7845bfa +size 8602554208 diff --git a/model-00077-of-000163.safetensors b/model-00077-of-000163.safetensors index c58210527228a3418802521dffd4f74673f7dbc6..9f7177da0134bfb33cba7cbd9b6ba8bba9b9d703 100644 --- a/model-00077-of-000163.safetensors +++ b/model-00077-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1411532f8eab4dec6efe251cfdf83e8367221062b90c209bb2e1353f92d40b27 -size 4302384963 +oid sha256:3400a940e5910e410faabf5448ffbb6d18d9f879834a9ba7d41510c4cd7b0f60 +size 8602554448 diff --git a/model-00078-of-000163.safetensors b/model-00078-of-000163.safetensors index bb1432f827c88c4600816362e3696367111003b6..4b4e1dc66f8515293fb6ee026a87e00ae36d66e8 100644 --- a/model-00078-of-000163.safetensors +++ b/model-00078-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f8ad3219d64a3e9c7cb5ce15dba761f4c25bf15cd1f3a4f5d500abf19d0187c0 -size 1747417474 +oid sha256:836e8b550e788541ec5ffb6b32ac4bae99978ddbd2d6f8fbcde5806f4b1b8e46 +size 3493899088 diff --git a/model-00079-of-000163.safetensors b/model-00079-of-000163.safetensors index 458833c223b4ce11253ef4f3b74ceacf348e60a0..843a624026d6118b901ed2dbeae17d7ebd7b70e4 100644 --- a/model-00079-of-000163.safetensors +++ b/model-00079-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1d74c9e9383be2f47b735a3fe604e98c3163e14a2492790a3f8b0e25af6181b1 -size 4302317817 +oid sha256:d51a3594ec79036244fca6d106de95d6303380b8acd1e3d79d34149145264d5d +size 8598757608 diff --git a/model-00080-of-000163.safetensors b/model-00080-of-000163.safetensors index dacd6580e0e92287f317d9fc1e2d91f86b74011f..5da161444f68d293bbc3b21da5cfc60f0c346acb 100644 --- a/model-00080-of-000163.safetensors +++ b/model-00080-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:edfb4c02a4a6486a8ce7c96115f4bf03151500cb4e6c9f56b0388357b6fe3547 -size 4302384914 +oid sha256:e21caf3b004f1d5bf52779d7b4226e97657223f2dd270a693325b7c43fcc2487 +size 8602554424 diff --git a/model-00081-of-000163.safetensors b/model-00081-of-000163.safetensors index 737f7d59a8f761878e27e4b65c50202a282f87f1..4bc4cd9266834b26456a0dca7b720d9591fb4394 100644 --- a/model-00081-of-000163.safetensors +++ b/model-00081-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9b1e9d08aba3eb055a97cebdf4dfa03200bb06a4eb79fcb0943ad59a523b5844 -size 4302350794 +oid sha256:268fdb4e0a94d29a884081ae75cf4472adf80dd50cda8583192bee09e9984d68 +size 8598786704 diff --git a/model-00082-of-000163.safetensors b/model-00082-of-000163.safetensors index 0b3488b6bce3e48326cfa5b9e6eb503d04b12291..7594e623651ea97730ba3c310672a8c5a069756b 100644 --- a/model-00082-of-000163.safetensors +++ b/model-00082-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d8c4620641dd1b6cd48d42c9e9603adafd7b620146607dc731cb73a744df67aa -size 4302384518 +oid sha256:1b3b165c4f92446bbebdccf65d60aad4ff0bba3e884c1e016e5f27b98fb7af54 +size 8602554224 diff --git a/model-00083-of-000163.safetensors b/model-00083-of-000163.safetensors index a4e9a6715d7671021f191d634537e53678fd44ac..cf73eb2ba5aa2f8bedd426221e3f907c5a07a52a 100644 --- a/model-00083-of-000163.safetensors +++ b/model-00083-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c273f728b6c90fa4cb4d420ce030e4b07972a8bc52996a69deac47334d04b5e9 -size 4302384963 +oid sha256:09db84761d8e985cdd47d6366b798696c9ae54a478b21647b38845fea018272b +size 8602554448 diff --git a/model-00084-of-000163.safetensors b/model-00084-of-000163.safetensors index 9cdde822bbcbeea2ef746ddc9bd85d5d4423d381..7621ae100a7edbe1886088ce41ab715e44b2f933 100644 --- a/model-00084-of-000163.safetensors +++ b/model-00084-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:424e18ad35dfc53f392d60109f8cd5cbd420e94ebaf43e304be157215442f6b9 -size 4302350602 +oid sha256:46eb3c357ca882ec337412f7dbc6deef7914f2062ba72290d795eb5c8c22e765 +size 8598786608 diff --git a/model-00085-of-000163.safetensors b/model-00085-of-000163.safetensors index 2f1ffc40e2af7a43238663db7a4b60902263776e..0ca64f7909452c3914b888a83d99dd54dc44f67c 100644 --- a/model-00085-of-000163.safetensors +++ b/model-00085-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b1690a7567a686b355d1c810193b3ab0b5d82648bb93194e9043b30274d1d24b -size 4302384710 +oid sha256:a9e55ef86fe7535da527daeb5485fc689d7ca534afd87d484a2dd2bb00053e80 +size 8602554320 diff --git a/model-00086-of-000163.safetensors b/model-00086-of-000163.safetensors index 22ff9217031000ffa90edc5a9bdfee65afef07b9..61a47e6bd52e4836c0529761e00a5e6d88f900d8 100644 --- a/model-00086-of-000163.safetensors +++ b/model-00086-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e65eb5913f33530c02b142f215de8e0583b1392aa242c5681fc99a2f32a0243f -size 4302384963 +oid sha256:bb760c9de5041dd50b917d1b04fca66d5e61208b367d6798ad9d9d78f831dc5d +size 8602554448 diff --git a/model-00087-of-000163.safetensors b/model-00087-of-000163.safetensors index 5a28e3df9083f4e2a6eb564a026a6e2c085dda87..2106b8edd2f53fcccffab739bae1590373c2a4c5 100644 --- a/model-00087-of-000163.safetensors +++ b/model-00087-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2dc4e3d4751f687a087547faab88658d83c5e164337dee28858f3f2c0242c0d9 -size 4302350432 +oid sha256:eff7f7a94c69b698c531f72dcef52e0c8e1da7d552b259d111977793f470a631 +size 8598786504 diff --git a/model-00088-of-000163.safetensors b/model-00088-of-000163.safetensors index 2dc66424f03ea34a061c11077095135898b82c40..e5f01661c275723c735aca8c9d1b136b706ce8c6 100644 --- a/model-00088-of-000163.safetensors +++ b/model-00088-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:54940d6614221461f951080d2fcf34b85e9bf325138903588e1fd4ac964963ff -size 4302384900 +oid sha256:32bfbd43255e0c0e89085b98515587ec832267dd78105c2bbfe5e158efb862f8 +size 8602554416 diff --git a/model-00089-of-000163.safetensors b/model-00089-of-000163.safetensors index 3b038f7c736b2f4d8384b7e094f96343be6439d7..2dd228eb609ed266f2ba71597288bdf69918753f 100644 --- a/model-00089-of-000163.safetensors +++ b/model-00089-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:38e2520475fd10ab74587d481f0e0fe71909f428a1118e132b4a6600a9f68407 -size 4302350808 +oid sha256:594549ec17c1c115fb616b8006b9dfa126993f6936860ec4cf290e36c130f9fa +size 8598786704 diff --git a/model-00090-of-000163.safetensors b/model-00090-of-000163.safetensors index 858423fdc990be035ad7259f08628cb44a2ff620..3ee1df08273bb6257b7b7fa4ea9a047557081285 100644 --- a/model-00090-of-000163.safetensors +++ b/model-00090-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ee933f59ddd234abc6d13968e04d00f824508fab76749b813a69fe8239356246 -size 4302384504 +oid sha256:af137cf1f8cca460b3642a839503e465883aff451fe7fd2fadb6e8a579e9185e +size 8602554224 diff --git a/model-00091-of-000163.safetensors b/model-00091-of-000163.safetensors index 30063dff25829c44b0586c7e7c5a04c8455de452..672318334e6298f7cbbb590b61faf945da026e39 100644 --- a/model-00091-of-000163.safetensors +++ b/model-00091-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4bacfdad2f2cf0230ab890e88de8a39082986edd10a9feb67be1ed086683a8d0 -size 4302384961 +oid sha256:29492ca4644102ed8c38a512b23babfe5e58d6b08426d6e55e5efb2fa232d7e3 +size 8602554448 diff --git a/model-00092-of-000163.safetensors b/model-00092-of-000163.safetensors index 1635e07222a547e13d439c165546e7559b2565bd..aef9ef7d998a201597bb955c60d0be5c4f8ecadd 100644 --- a/model-00092-of-000163.safetensors +++ b/model-00092-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:74fd6b1a280b6e8cb8560dafee0fff8955b311aa43cc15c42f96269350066cb8 -size 4302350620 +oid sha256:698d5cfb4b1043abb951fbc5450706e33a0d2da53baa19c0625da2f85470df35 +size 8598786616 diff --git a/model-00093-of-000163.safetensors b/model-00093-of-000163.safetensors index 017f6fd0df068d8a74237916b4e0f2fb6a565e86..187177cae6e64e9c046f548dca2d432831c83e70 100644 --- a/model-00093-of-000163.safetensors +++ b/model-00093-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:714adb4ffc41739e67d7913131f3f2cdcf2d2eaae6fe08b51f312cd38a33099e -size 4302384692 +oid sha256:e9049e18a0a8a65a03687e40749161cfe4b74874494ad474dc2dfd7457fd110d +size 8602554312 diff --git a/model-00094-of-000163.safetensors b/model-00094-of-000163.safetensors index 2d785fdb7885dbb364f3fb1715d491eb1452f5f1..1cb22cb8019e5f5946bf76200dd62d0d94506d85 100644 --- a/model-00094-of-000163.safetensors +++ b/model-00094-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3bcdaa226ac620afc7cb51d4f7b3ff1043ed5697b60349af85e2830607a8693 -size 4302384963 +oid sha256:3b7dea3ac82289d7c805a708d5579d301c8d0068c1e05dbeb47535564fb9f4fb +size 8602554448 diff --git a/model-00095-of-000163.safetensors b/model-00095-of-000163.safetensors index dbbcc1509cfb883c1a2e355dba9092eefd3df3ed..ab0698b12f84a6965962b82ea1ca79d21cf9ef7b 100644 --- a/model-00095-of-000163.safetensors +++ b/model-00095-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1e0ad4783bf46b8698c650ba08713e1a9077e2894bcc039f703c5ac4a0a2a1f1 -size 4302350448 +oid sha256:f9273f1a3a4d1b24d5be1749f95f3f286832109362ed78df3903db865d694670 +size 8598786520 diff --git a/model-00096-of-000163.safetensors b/model-00096-of-000163.safetensors index 7c3d0b1c48591f57c25e7a609c0407addafe6aaf..83538e866e2043c5c00334cbacab1b7b99c9c1ee 100644 --- a/model-00096-of-000163.safetensors +++ b/model-00096-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dac3287c0ab7d0c4e33d7acb78c5e472fcaae3bc8f952337d4e7d898142a13cd -size 4302384884 +oid sha256:1b939b1649e74279090c8e9c2b3a4baffa60e55372fa628b246ddf36f484de81 +size 8602554408 diff --git a/model-00097-of-000163.safetensors b/model-00097-of-000163.safetensors index 9a563e1c3ee6a513cb494c3b66c4f055afacb949..2e5a264c5adcc873c91f0578de67456b580d4210 100644 --- a/model-00097-of-000163.safetensors +++ b/model-00097-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:17bd26dc53c5f3855432b6169324cc30ce4c6fbb1ffa045a690774e92cb18a3e -size 4302350824 +oid sha256:b1ee6840bb4ae390869954c4abe97030a163b6479985344dc723ff957a6ac2af +size 8598786720 diff --git a/model-00098-of-000163.safetensors b/model-00098-of-000163.safetensors index 8cb6f0d06f07eb9415558008ab96aedd9eb34769..9763363ae7bf3be401f365c7a2c26996e65a9671 100644 --- a/model-00098-of-000163.safetensors +++ b/model-00098-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0c1ccb0c95ec399cab9920c9ffe4206f684819a8ecbe69ab7316e3619fa14c90 -size 4302384488 +oid sha256:35102e570ed4de1f0660d5d6bfb8c367de2e2128e810f490b4ab84725f9e72c9 +size 8602554208 diff --git a/model-00099-of-000163.safetensors b/model-00099-of-000163.safetensors index a337010b32dfb2bb896fe9f5fe40b3f2d1dc8a5c..6db9194ac961ebd4551e94e3233c2e16903e4894 100644 --- a/model-00099-of-000163.safetensors +++ b/model-00099-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:aa3fe3e6fb2e54f9540d62fae524a3986ac0bdbde8caa89057b691bb47f43606 -size 4302384963 +oid sha256:4c33ab4239693ecc54eb57bc188e1dcbd7dbe0db6e5bae1e61bfc1080bd392f9 +size 8602554448 diff --git a/model-00100-of-000163.safetensors b/model-00100-of-000163.safetensors index 632d46315ab07d68d75e127355a816523540a189..69dfaacc0ad284886ec8f299a128ce2bcdc67425 100644 --- a/model-00100-of-000163.safetensors +++ b/model-00100-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:300556119da43604b27f63ef8cf38d9805fdfa7014648b41583a01d13da44039 -size 1747417474 +oid sha256:cb6963e86fd900a84f4987feca7526361bb2e714e1ad1c428ebf9f1086722b78 +size 3493899088 diff --git a/model-00101-of-000163.safetensors b/model-00101-of-000163.safetensors index 7b1ffbf699ff1d5fc667ac2b13eb787cadc25a9c..db1cd619158b173d8a9affbc9bd6afc2dfad10fc 100644 --- a/model-00101-of-000163.safetensors +++ b/model-00101-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d3c4705db6287dd9eeca891c6ef8ab18fa8c1b7a4b15b30f7a789174affe02bf -size 4302317817 +oid sha256:928b263d92524520fa26dfd0b326b722eb43f333e513d61851207c039cdd413c +size 8598757608 diff --git a/model-00102-of-000163.safetensors b/model-00102-of-000163.safetensors index b6e8648b7a79021e7771dd52d13d31da9f6f07bd..04964eb27bf5a22c94b37cbcafa4f61181de5c85 100644 --- a/model-00102-of-000163.safetensors +++ b/model-00102-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:945d2f833dfcdfb0fe99c97e3c5eb62ee1c53f5afed771e403e24ffa000118bb -size 4302384914 +oid sha256:730fcb83aa49dffd318543a55c4cdf8a1efacb3860e7ee6ade0344460ced2b59 +size 8602554424 diff --git a/model-00103-of-000163.safetensors b/model-00103-of-000163.safetensors index f424cc05835c8ddb9c8fd990caf042e2ab320fb2..113262185540bea6406b7932f6f6e7978a275b49 100644 --- a/model-00103-of-000163.safetensors +++ b/model-00103-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:db5d341e101aa225d0f34d907e94b58df727f555fa527806f5c8769e85d89186 -size 4302350794 +oid sha256:adc5c0d711e7e6c87f6dfc65872bfe897547ce21ed1bb96b8b5daad32becb2a3 +size 8598786704 diff --git a/model-00104-of-000163.safetensors b/model-00104-of-000163.safetensors index 5daeb6f59dcef7649c5d93bde7e63933945d6f92..708ef618c8b48ee1d2a9b8b561187b9d37bc2404 100644 --- a/model-00104-of-000163.safetensors +++ b/model-00104-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0d77661790144797227dcee08148e4b90acf72875eedd391088f27a4c24e9156 -size 4302384518 +oid sha256:b653d66c811b7e851cb36afdfa39d77f353df1ec41e9a3d529bc8596ea64ddf4 +size 8602554224 diff --git a/model-00105-of-000163.safetensors b/model-00105-of-000163.safetensors index b6423e2d2197541b3f590f633a05c322291b3484..12abdb39d7f0853018858862a5293a58c1d1b6e0 100644 --- a/model-00105-of-000163.safetensors +++ b/model-00105-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f1466e6a5fd872423c7ea902903142e9b6abb0d3d4c2aba311101e905636df88 -size 4302384963 +oid sha256:065f702fc487c7e31436f59168c740551d7bddfa0869d1a6fa43afa782c8d37e +size 8602554448 diff --git a/model-00106-of-000163.safetensors b/model-00106-of-000163.safetensors index cc5fa77f17f45d06099f52fa32f7567e4b0ba78d..d23a912bac46cb328ec420644c616df8a27efeb1 100644 --- a/model-00106-of-000163.safetensors +++ b/model-00106-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:84f318ee430b731ebe2722e026413e8f70002af2fbee5f60003647fa47b20518 -size 4302350602 +oid sha256:a09deb76871c8369848a0b18ecbe8a064aa9e100ffa43dec0a36a2021aa69e73 +size 8598786608 diff --git a/model-00107-of-000163.safetensors b/model-00107-of-000163.safetensors index 6db4806bb084c05b9d8f4d4bbc9bb1b033879ff4..44fbe58340c3915f03547f2885f36fbe7196e13e 100644 --- a/model-00107-of-000163.safetensors +++ b/model-00107-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6b37a206419d5a14b2212085e075997662a922338c95404128bd40d5ba6ce090 -size 4302384710 +oid sha256:a758c0bd7c4930765ee695bf31d5a8ff43d8bf9ac46192f34e6372e37a302a44 +size 8602554320 diff --git a/model-00108-of-000163.safetensors b/model-00108-of-000163.safetensors index 669e9311a088652dd0bfaf6015df5db6138505c7..dd01c79d8c7677764447030c5410f529e05fda01 100644 --- a/model-00108-of-000163.safetensors +++ b/model-00108-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6b6e4d2332183e0fa8d72ac930551038bb8c971a1a7b38abf80211ddc32cc341 -size 4302384963 +oid sha256:9e9c2fac7b6df5b4d3d34bcb793741086b62c31f857b915ac32eab689a46433e +size 8602554448 diff --git a/model-00109-of-000163.safetensors b/model-00109-of-000163.safetensors index e3fb7ea38dff034a2505d6c20e4648a58058e868..06880a431bcfd11ce3c4cf0941a1ad385e8eed77 100644 --- a/model-00109-of-000163.safetensors +++ b/model-00109-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4d67e9fd9d13f05bb9613434b4090408eb203b4d985aec0e2ea9ef489928fe25 -size 4302350432 +oid sha256:d4c6ba178de822b0844ef5c8b2b6d524d44c96f549bab95a05049adb0add54db +size 8598786504 diff --git a/model-00110-of-000163.safetensors b/model-00110-of-000163.safetensors index 500d4de13d2368019b721a0c260bd7bde2cac3c7..1483c8ffff6020071d3ebc0a6f539b52e2a39d26 100644 --- a/model-00110-of-000163.safetensors +++ b/model-00110-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5a42f528fabf1a31f3723a9d26f9bbe4e6de2af520f2894f23316ee0f6856464 -size 4302384900 +oid sha256:05cc592517d8b0b7dc436a6b8c0b754db466368b91ed392e8c3e608fbe721aeb +size 8602554416 diff --git a/model-00111-of-000163.safetensors b/model-00111-of-000163.safetensors index 188635c629ecbe544201e4584ef316d9d3c45d10..52fa612cc6cee8a7a1345e6114c61e49a85f91dd 100644 --- a/model-00111-of-000163.safetensors +++ b/model-00111-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1eff3d3853efd53477d2cc40a23bb7b0a156056fd94fdb32fe6ee0e5949349b7 -size 4302350808 +oid sha256:693317186a4b52c0c5138da8ce6a647fae81e29aacc37c436122eea7cf0737f2 +size 8598786704 diff --git a/model-00112-of-000163.safetensors b/model-00112-of-000163.safetensors index 467913e0f1cf41c7a92805b9042ebbbbdf38d390..d57f46bf7e61acf862813b759ea8ffa06f4a0be5 100644 --- a/model-00112-of-000163.safetensors +++ b/model-00112-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0fe9b6e8662d8c8fa2b1dd80093e028ea2dc3c892ec78d782a34bd790c7b3eb2 -size 4302384504 +oid sha256:166f049112924ff6e0aa8140918facd59a1e7fd02bda26fc9ae1d2e9a05dc8a8 +size 8602554224 diff --git a/model-00113-of-000163.safetensors b/model-00113-of-000163.safetensors index 18cdc6635473cc5268b1b5fa3fecfcee54d6c699..02ea3bda4f917029fce3c0910d94fcab9043637f 100644 --- a/model-00113-of-000163.safetensors +++ b/model-00113-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8c1b3e7e97cb12408da630027eb04ebae01a3f633a504b5857234909da755727 -size 4302384961 +oid sha256:effffc667d242969d444fdc6e813b1ca704f7c228605a88a967bbc82953697f5 +size 8602554448 diff --git a/model-00116-of-000163.safetensors b/model-00116-of-000163.safetensors index bf4f96f4c651b6a8baffd79f3302c0dc9ef49d34..fad1154e401bddbb392fba6d6060fd142bc9dc70 100644 --- a/model-00116-of-000163.safetensors +++ b/model-00116-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3e933d3d9c42febc9a58abb187827fa2a511795528e7f7dfb2a5a8fcaee908a5 -size 4302384963 +oid sha256:5fc53268af228cf1cdb056ec7881d95298c89fe4ea84559e5ac9356461a2b7a1 +size 8602554448 diff --git a/model-00118-of-000163.safetensors b/model-00118-of-000163.safetensors index dc69bca4b2de1707b83d9da68e3ce8284545b999..2d4805e9bb1c728c3726a39e9fce4951f50dccff 100644 --- a/model-00118-of-000163.safetensors +++ b/model-00118-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8e27a9cb1d1c2490f6fc903fe3f4e164990ed08941c246c935bc4c35215ac1a3 -size 4302384884 +oid sha256:0ac618b9c28cb85ffb68757bfa6e8b81b82fcae96ad6ad36133f15ee31ecca99 +size 8602554408 diff --git a/model-00122-of-000163.safetensors b/model-00122-of-000163.safetensors index 1033294ebed8c9354e1be60ad95cba8d0685aeec..0743df33ee47a850bded8a636bd5afa5dbcff127 100644 --- a/model-00122-of-000163.safetensors +++ b/model-00122-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7337345a219a07647eb751e18d0f250627dfe186cbf43c576e2c2b93aa448bf0 -size 1747417474 +oid sha256:85e9e443d9adc3c25eeed1d136646a77d6f1b9abac5142338d34928514e07bb4 +size 3493899088 diff --git a/model-00123-of-000163.safetensors b/model-00123-of-000163.safetensors index a53a42bebee35160540017c38a8fb75a48fee2e0..d3e567bdd07368657c8f4ff4ecf71e2504d0c848 100644 --- a/model-00123-of-000163.safetensors +++ b/model-00123-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d50d3129ef6f4f80f89498f0ba426c373fda04a204a40d90a603e1e950734653 -size 4302317817 +oid sha256:00123b9d32302b36ce51804d43d21d4b5d92e30f4746b04c0d2f6f71f0d0e3f0 +size 8598757608 diff --git a/model-00124-of-000163.safetensors b/model-00124-of-000163.safetensors index 14804a7166003be0f0243ad65cae5df037503fe1..7129876b3938211eae41616b039e8bdcfe2a93ec 100644 --- a/model-00124-of-000163.safetensors +++ b/model-00124-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6f207cfa394faf3ab78abc9eaa30109bc8d56b2bd7c0b7d96ce11d8271758cbb -size 4302384914 +oid sha256:4d98f426ac234d180c2e8cbc7c3ccf8a2762e78bf1e4d39474cc5fe147b56d5e +size 8602554424 diff --git a/model-00126-of-000163.safetensors b/model-00126-of-000163.safetensors index e39fee183ddc8da741363acb6317fdc258fd1546..65edb62d14651aeb136d8c483d92d80aee2bf396 100644 --- a/model-00126-of-000163.safetensors +++ b/model-00126-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2f6ba5a5471da07f597497d6caf7fee6b8056a501b3e6da55ff3dd1c9ad63e6b -size 4302384518 +oid sha256:880b53640cf8b75da9b828b93c373e63e6b613f491e940a15afd39d25f030fc0 +size 8602554224 diff --git a/model-00131-of-000163.safetensors b/model-00131-of-000163.safetensors index 54a5083fc12a09de3f4623b28db83cc012e6a80e..1114bcd10670ead8e589bfd3c2ed2fa9bef56dac 100644 --- a/model-00131-of-000163.safetensors +++ b/model-00131-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0199456e2b1a8de161b4ede2f61b41a639486da4a250194f6b7b83f662f931d2 -size 4302350432 +oid sha256:0e2e44df80ba461143aa992e33b1b07662650c5a81ce3e9f73c4045272c906d4 +size 8598786504 diff --git a/model-00134-of-000163.safetensors b/model-00134-of-000163.safetensors index 7b5dfac2f531c81d27a0755e022bef5ae1c4eeaa..24a49a344e549bf98753b5e95e257f7db6c8f5f2 100644 --- a/model-00134-of-000163.safetensors +++ b/model-00134-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1b3b36d497b9e23b9a4a3626164384639e776dd79acdec24d687d0e129074b07 -size 4302384504 +oid sha256:e888344a564ac24700d6b4fb1d7e42aabdffd309847cafc908bf74e7b39e2fda +size 8602554224 diff --git a/model-00141-of-000163.safetensors b/model-00141-of-000163.safetensors index b70a8e0ec7ddd6d776439c1a525c6a422bdea2b1..c4b97d336893fbe701cb50ea836008f95e00549e 100644 --- a/model-00141-of-000163.safetensors +++ b/model-00141-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dd1c282ddba12c984f18b60915516af5ef1de35521b3165b1991c121d7861288 -size 3142388798 +oid sha256:fd97d1767f887dc24aeeae4aba07b111d64cd4294ea7ad9940764b0f1cca7971 +size 6283123256 diff --git a/model-00144-of-000163.safetensors b/model-00144-of-000163.safetensors index 61a27045f8fde34cbf53be9e10a50477de380b4a..34ae1ba51641a9b845b88c11e86a0ce3b54dae55 100644 --- a/model-00144-of-000163.safetensors +++ b/model-00144-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b76fd57f1662890c904313d4d448254d864d8b5325ae76ab21ba6b4f50fa0278 -size 4302350794 +oid sha256:d06e5c4114338ace0d1b2118d0893afce58b1da40b830de5bf33e2dc71653af7 +size 8598786704 diff --git a/model-00146-of-000163.safetensors b/model-00146-of-000163.safetensors index 7de194e64232ab4137926bfa51188d5f94241da8..b3758b47ecf7244d80034ba9e1fdb39117e4c1ad 100644 --- a/model-00146-of-000163.safetensors +++ b/model-00146-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:981ed532393ecf1a2120f6af638a9458662f4d6e2d3183e263ea97a0b3bf47bd -size 4302384963 +oid sha256:cd26d981cf45884d305afca916e1ee10c28978113436f4b183d9928d9ab3ccca +size 8602554448 diff --git a/model-00148-of-000163.safetensors b/model-00148-of-000163.safetensors index 1ca8f4ba9d126febaf758d18ebeb23ebc4112179..e74341f71d070d2864953a1e6aa57549be792822 100644 --- a/model-00148-of-000163.safetensors +++ b/model-00148-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6b47933264ddc95aaa64e328826a286612996259e8a84e67d5793d85e3a5189a -size 4302384710 +oid sha256:22bc8c994b5574072e40b30937d38d7028726abde67e24b5b2f13901d65110c6 +size 8602554320 diff --git a/model-00149-of-000163.safetensors b/model-00149-of-000163.safetensors index 004b013f5eb1136cbc6e5de8c6a1664b4a4ac60d..572724ca1b3c179eca22f62c487ccdc9ed255646 100644 --- a/model-00149-of-000163.safetensors +++ b/model-00149-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:22a2f518d7bc6803e4dd0c652b6023b3831d68632a0caae6d9c792efbcf3f547 -size 4302384963 +oid sha256:65facc6a621d82a2af92e03d0635dfc7d1affc501fece14af394be58b8fb9de8 +size 8602554448 diff --git a/model-00150-of-000163.safetensors b/model-00150-of-000163.safetensors index ff614dbd1dba241ebabad1cadfdb1ea5ed58338d..8be0f239c0c25fc65df777450b75fac3256e5f81 100644 --- a/model-00150-of-000163.safetensors +++ b/model-00150-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4b4ca747261d55cb526afc6d8298b26b333b9738eb16cfee4fcf09e70970145b -size 4302350432 +oid sha256:5d3df7be3bf159f6c31a86e34b2115d0044e3391301f1fbc5e641285f2d5293e +size 8598786504 diff --git a/model-00152-of-000163.safetensors b/model-00152-of-000163.safetensors index dbcfaa9bd698bd3a19c9f109c4c6ada485f69f9d..025bb79872e6978e0ea9ecd47df28de51600155f 100644 --- a/model-00152-of-000163.safetensors +++ b/model-00152-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e6adb0bb80711fecb36417763b4c4be2302b26beb1abc42e1b90cdf6db822fb8 -size 4302350808 +oid sha256:70587dcd6fdae5681fcba0d0aa19ddaf175d3feef2d5c3e47b8f8e6fab0e7167 +size 8598786704 diff --git a/model-00153-of-000163.safetensors b/model-00153-of-000163.safetensors index 9468f958a3fd57ef1583257377e6f4815e927c69..a47bf37b226a61f0bc5f0e04309afee40e0ff8f5 100644 --- a/model-00153-of-000163.safetensors +++ b/model-00153-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fe3867b4e2463f48999878c93510838515661358384e20f85f5f64babbe1164c -size 4302384504 +oid sha256:e13964da608a929d25f7d0a6b5b850d1221d446f6bf58bea00a23ceaf77bd192 +size 8602554224 diff --git a/model-00154-of-000163.safetensors b/model-00154-of-000163.safetensors index 03f256d4af8039d49bc8c5931983caccccf494be..0e0b92e20659acefb2b97cb0c986e74ade132a09 100644 --- a/model-00154-of-000163.safetensors +++ b/model-00154-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:78fdc257544f6dff8b35bf9b79ad2a6e01355767ddbb472138139ab9305c90f6 -size 4302384961 +oid sha256:7aeb9c130a2ff2d15bce05cd3318b095d2ad604258d3b5bae28437d594dc8dc1 +size 8602554448 diff --git a/model-00155-of-000163.safetensors b/model-00155-of-000163.safetensors index cc616ab4adefbfb74372c4c3c139c678cb213f4c..c4bd0ac036d805f7dc4876321328a1cffe610c03 100644 --- a/model-00155-of-000163.safetensors +++ b/model-00155-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:834632439e8855bdae240382455809b650c470f25984d1b9f10774b3a6a57162 -size 4302350620 +oid sha256:962ca7aaf44448e5365a8e918a9eae9b69be92968db82114643fba11f7b5d023 +size 8598786616 diff --git a/model-00156-of-000163.safetensors b/model-00156-of-000163.safetensors index 66b458193214a17271e68527c5edcfc7001b9108..641a34561df699423abb85993a27b04219c22f5a 100644 --- a/model-00156-of-000163.safetensors +++ b/model-00156-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4beb34c5173fee4ca8abb6136160c10877842134f11232b5f414ce27dabff174 -size 4302384692 +oid sha256:31393ee79e481493b72b3f23f5ca4fd90d1180cab0b105fab4de681106cca888 +size 8602554312 diff --git a/model-00157-of-000163.safetensors b/model-00157-of-000163.safetensors index 97ddaae573e9b451584cec2a485d3e1f9cfa796a..e246e74b071c3996700aea1cf9b63ff8739b56d5 100644 --- a/model-00157-of-000163.safetensors +++ b/model-00157-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c313d28a29f8096e2e7ae1ebf2c0656e9c2ca49a85ddd74632aee7a00b53b765 -size 4302384963 +oid sha256:af61ad2dc4c87cd59d4b3668cf8d68979512d4ef5aab3104da7b6118a14a9c00 +size 8602554448 diff --git a/model-00158-of-000163.safetensors b/model-00158-of-000163.safetensors index 0fd3f77323bb4cc20982f098f81b76e70ac2f8ad..fc7d4668c8d64736496414100cd825d52117b7a0 100644 --- a/model-00158-of-000163.safetensors +++ b/model-00158-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f0448fba1ddb4f7fb75caa110cc1ea488767a8c4ffb7745417ee6345b34e842b -size 4302350448 +oid sha256:2d2f56a2513e7cb200fed07531addfb881a488bd5e3b2e661d7c28830277b056 +size 8598786520 diff --git a/model-00159-of-000163.safetensors b/model-00159-of-000163.safetensors index 8e179cfc329a7d72c5fc6b8bec0ebdcc5779f9cd..ac9763a114122652ec7c57e9344c58d9ed845412 100644 --- a/model-00159-of-000163.safetensors +++ b/model-00159-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:77a6ec3076e549816a5f39f87c0369c539c2c1e066675b3f53b5e0f485ba5507 -size 4302384884 +oid sha256:aa7d802110c9bcb6303b2bc8e77afa6a31f196b534eb9df63d1e58f17503797c +size 8602554408 diff --git a/model-00160-of-000163.safetensors b/model-00160-of-000163.safetensors index 6961183d17e10097a1f102a1b40b8a75ec00cbc4..4192f237548ec1884ba5c30f39393192f3d9a541 100644 --- a/model-00160-of-000163.safetensors +++ b/model-00160-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f621991fbc9ce0a4e2d4a7348f3575185197335a7cb24b0aeb4941ddfcebd54e -size 5230637362 +oid sha256:6c8a932ce49bba0f5489f30a13708532cb8bc727667dd76ac60a4371377095ef +size 8602463472 diff --git a/model-00161-of-000163.safetensors b/model-00161-of-000163.safetensors index b02f18b70444cb73942a60c6134b0b875079b441..b23307755a9457a4a9914a78854a60831ae86ee4 100644 --- a/model-00161-of-000163.safetensors +++ b/model-00161-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e1e75d7f80863220bb695da847bf3c7946f6646736bda827244bbaeb65776b27 -size 4302384321 +oid sha256:b65a6d2704cdc7c20c5e7824e8c0461e68adecc97977b437a00d5d77b8424d24 +size 8602554128 diff --git a/model-00162-of-000163.safetensors b/model-00162-of-000163.safetensors index 95040aacec425300ce2d2ea77e41d32edc21a011..969df4465d0ae93b80862cade1c9ddf9a744469c 100644 --- a/model-00162-of-000163.safetensors +++ b/model-00162-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:53e717e22e28af1012bbc5c57e28ffa4e6ca8bec2a4e21d91955c25a830f2464 -size 4302384948 +oid sha256:0f8c12d03556374bdbc47ada0c4e7d299a4615dbd2d74da07218ac55b35a76e6 +size 8602554440 diff --git a/model-00163-of-000163.safetensors b/model-00163-of-000163.safetensors index 5b8b1c7e4d1877f16cba58b5df24fb38d2a1a3c1..123294428c1603b579b958ce202aebcfed7adbd5 100644 --- a/model-00163-of-000163.safetensors +++ b/model-00163-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:913177d9e0dfb228769e0a13a386c34b919dcbb32a430ce230979f53bf7ae5bc -size 6584784447 +oid sha256:8bc6106794d6f881eae142a1de5ef073ce0beb3204a4722de547dd72d606bd42 +size 9255875920 diff --git a/model.safetensors.index.json b/model.safetensors.index.json index 210ab5c5ca880ad0003c3b0ea876eb05f3215136..5b60276c1efb766f6a1aee2e357e27407f6ed12b 100644 --- a/model.safetensors.index.json +++ b/model.safetensors.index.json @@ -1,91991 +1,46181 @@ { - "metadata": { - "total_size": 1369062772000 - }, + "metadata": {}, "weight_map": { "model.embed_tokens.weight": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.self_attn.q_a_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.self_attn.q_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", - "model.layers.0.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.self_attn.kv_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.self_attn.o_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.mlp.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.mlp.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.mlp.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.mlp.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.mlp.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.input_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.0.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.self_attn.q_a_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.self_attn.q_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", - "model.layers.1.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.self_attn.kv_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.self_attn.o_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.mlp.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.mlp.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.mlp.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.mlp.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.mlp.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.input_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.1.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.self_attn.q_a_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.self_attn.q_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", - "model.layers.2.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.self_attn.kv_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.self_attn.o_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.mlp.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.mlp.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.mlp.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.mlp.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.mlp.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.input_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.2.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.self_attn.q_a_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.self_attn.q_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", - "model.layers.3.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.self_attn.kv_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.self_attn.o_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.gate.weight": "model-00001-of-000163.safetensors", "model.layers.3.mlp.gate.e_score_correction_bias": "model-00001-of-000163.safetensors", "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.shared_experts.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.shared_experts.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.shared_experts.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.0.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.0.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.0.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.0.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.0.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.1.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.1.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.1.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.1.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.1.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.2.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.2.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.2.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.2.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.2.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.3.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.3.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.3.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.3.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.3.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.4.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.4.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.4.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.4.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.4.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.5.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.5.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.5.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.5.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.5.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.6.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.6.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.6.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.6.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.6.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.7.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.7.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.7.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.7.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.7.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.8.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.8.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.8.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.8.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.8.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.9.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.9.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.9.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.9.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.9.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.10.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.10.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.10.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.10.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.10.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.11.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.11.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.11.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.11.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.11.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.12.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.12.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.12.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.12.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.12.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.13.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.13.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.13.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.13.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.13.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.14.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.14.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.14.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.14.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.14.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.15.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.15.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.15.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.15.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.15.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.16.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.16.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.16.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.16.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.16.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.17.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.17.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.17.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.17.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.17.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.18.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.18.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.18.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.18.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.18.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.19.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.19.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.19.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.19.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.19.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.20.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.20.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.20.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.20.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.20.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.21.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.21.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.21.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.21.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.21.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.22.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.22.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.22.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.22.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.22.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.23.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.23.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.23.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.23.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.23.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.24.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.24.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.24.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.24.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.24.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.25.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.25.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.25.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.25.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.25.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.26.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.26.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.26.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.26.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.26.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.27.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.27.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.27.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.27.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.27.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.28.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.28.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.28.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.28.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.28.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.29.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.29.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.29.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.29.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.29.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.30.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.30.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.30.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.30.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.30.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.31.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.31.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.31.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.31.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.31.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.32.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.32.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.32.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.32.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.32.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.33.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.33.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.33.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.33.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.33.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.34.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.34.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.34.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.34.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.34.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.35.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.35.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.35.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.35.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.35.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.36.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.36.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.36.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.36.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.36.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.37.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.37.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.37.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.37.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.37.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.38.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.38.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.38.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.38.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.38.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.39.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.39.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.39.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.39.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.39.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.40.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.40.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.40.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.40.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.40.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.41.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.41.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.41.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.41.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.41.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.42.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.42.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.42.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.42.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.42.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.43.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.43.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.43.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.43.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.43.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.44.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.44.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.44.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.44.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.44.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.45.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.45.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.45.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.45.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.45.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.46.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.46.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.46.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.46.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.46.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.47.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.47.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.47.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.47.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.47.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.48.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.48.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.48.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.48.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.48.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.49.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.49.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.49.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.49.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.49.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.50.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.50.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.50.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.50.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.50.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.51.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.51.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.51.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.51.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.51.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.52.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.52.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.52.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.52.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.52.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.53.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.53.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.53.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.53.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.53.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.54.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.54.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.54.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.54.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.54.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.55.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.55.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.55.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.55.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.55.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.55.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.56.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.56.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.56.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.56.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.56.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.57.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.57.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.57.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.57.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.57.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.58.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.58.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.58.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.58.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.58.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.59.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.59.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.59.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.59.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.59.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.60.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.60.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.60.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.60.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.60.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.61.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.61.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.61.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.61.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.61.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.62.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.62.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.62.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.62.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.62.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.63.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.63.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.63.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.63.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.63.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.64.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.64.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.64.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.64.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.64.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.65.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.65.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.65.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.65.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.65.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.66.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.66.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.66.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.66.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.66.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.67.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.67.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.67.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.67.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.67.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.68.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.68.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.68.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.68.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.68.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.69.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.69.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.69.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.69.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.69.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.70.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.70.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.70.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.70.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.70.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.71.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.71.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.71.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.71.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.71.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.72.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.72.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.72.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.72.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.72.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.73.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.73.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.73.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.73.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.73.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.74.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.74.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.74.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.74.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.74.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.75.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.75.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.75.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.75.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.75.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.76.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.76.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.76.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.76.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.76.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.77.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.77.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.77.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.77.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.77.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.78.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.78.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.78.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.78.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.78.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.78.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.79.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.79.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.79.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.79.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.79.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.80.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.80.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.80.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.80.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.80.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.81.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.81.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.81.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.81.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.81.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.82.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.82.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.82.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.82.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.82.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.83.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.83.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.83.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.83.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.83.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.84.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.84.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.84.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.84.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.84.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.85.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.85.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.85.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.85.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.85.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.86.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.86.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.86.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.86.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.86.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.87.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.87.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.87.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.87.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.87.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.88.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.88.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.88.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.88.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.88.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.89.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.89.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.89.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.89.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.89.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.90.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.90.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.90.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.90.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.90.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.91.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.91.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.91.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.91.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.91.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.92.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.92.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.92.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.92.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.92.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.93.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.93.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.93.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.93.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.93.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.94.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.94.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.94.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.94.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.94.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.95.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.95.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.95.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.95.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.95.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.96.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.96.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.96.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.96.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.96.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.97.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.97.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.97.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.97.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.97.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.98.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.98.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.98.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.98.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.98.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.98.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.99.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.99.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.99.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.99.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.99.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.100.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.100.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.100.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.100.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.100.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.101.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.101.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.101.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.101.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.101.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.102.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.102.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.102.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.102.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.102.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.103.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.103.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.103.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.103.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.103.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.104.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.104.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.104.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.104.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.104.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.105.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.105.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.105.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.105.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.105.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.106.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.106.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.106.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.106.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.106.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.107.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.107.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.107.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.107.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.107.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.108.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.108.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.108.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.108.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.108.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.109.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.109.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.109.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.109.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.109.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.110.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.110.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.110.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.110.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.110.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.111.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.111.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.111.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.111.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.111.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.112.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.112.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.112.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.112.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.112.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.112.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.113.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.113.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.113.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.113.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.113.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.114.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.114.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.114.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.114.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.114.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.115.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.115.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.115.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.115.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.115.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.116.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.116.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.116.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.116.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.116.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.117.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.117.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.117.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.117.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.117.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.118.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.118.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.118.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.118.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.118.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.119.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.119.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.119.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.119.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.119.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.120.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.120.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.120.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.120.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.120.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.121.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.121.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.121.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.121.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.121.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.122.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.122.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.122.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.122.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.122.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.123.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.123.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.123.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.123.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.123.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.124.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.124.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.124.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.124.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.124.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.125.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.125.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.125.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.125.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.125.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.126.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.126.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.126.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.126.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.126.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.127.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.127.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.127.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.127.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.127.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.128.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.128.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.128.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.128.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.128.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.128.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.129.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.129.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.129.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.129.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.129.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.129.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.130.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.130.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.130.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.130.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.130.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.130.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.131.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.131.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.131.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.131.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.131.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.131.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.132.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.132.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.132.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.132.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.132.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.132.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.133.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.133.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.133.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.133.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.133.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.133.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.134.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.134.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.134.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.134.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.134.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.134.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.135.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.135.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.135.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.135.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.135.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.135.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.136.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.136.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.136.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.136.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.136.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.136.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.137.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.137.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.137.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.137.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.137.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.137.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.138.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.138.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.138.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.138.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.138.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.138.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.139.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.139.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.139.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.139.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.139.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.139.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.140.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.140.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.140.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.140.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.140.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.140.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.141.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.141.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.141.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.141.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.141.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.141.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.142.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.142.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.142.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.142.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.142.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.142.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.143.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.143.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.143.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.143.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.143.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.143.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.144.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.144.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.144.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.144.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.144.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.144.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.145.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.145.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.145.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.145.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.145.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.145.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.146.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.146.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.146.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.146.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.146.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.146.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.147.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.147.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.147.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.147.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.147.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.147.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.148.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.148.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.148.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.148.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.148.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.148.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.149.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.149.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.149.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.149.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.149.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.149.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.150.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.150.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.150.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.150.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.150.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.150.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.151.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.151.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.151.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.151.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.151.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.151.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.152.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.152.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.152.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.152.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.152.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.152.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.153.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.153.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.153.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.153.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.153.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.153.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.154.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.154.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.154.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.154.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.154.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.154.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.155.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.155.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.155.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.155.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.155.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.155.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.156.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.156.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.156.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.156.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.156.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.156.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.157.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.157.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.157.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.157.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.157.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.157.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.158.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.158.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.158.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.158.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.158.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.158.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.159.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.159.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.159.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.159.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.159.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.159.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.160.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.160.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.160.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.160.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.160.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.160.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.161.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.161.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.161.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.161.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.161.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.161.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.162.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.162.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.162.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.162.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.162.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.162.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.163.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.163.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.163.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.163.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.163.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.163.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.164.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.164.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.164.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.164.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.164.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.164.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.165.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.165.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.165.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.165.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.165.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.165.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.166.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.166.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.166.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.166.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.166.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.166.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.167.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.167.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.167.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.167.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.167.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.167.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.168.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.168.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.168.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.168.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.168.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.168.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.169.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.169.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.169.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.169.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.169.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.169.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.170.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.170.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.170.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.170.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.170.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.170.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.171.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.171.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.171.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.171.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.171.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.171.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.172.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.172.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.172.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.172.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.172.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.172.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.173.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.173.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.173.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.173.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.173.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.173.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.174.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.174.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.174.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.174.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.174.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.174.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.175.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.175.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.175.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.175.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.175.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.175.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.176.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.176.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.176.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.176.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.176.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.176.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.177.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.177.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.177.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.177.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.177.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.177.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.178.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.178.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.178.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.178.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.178.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.178.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.179.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.179.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.179.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.179.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.179.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.179.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.180.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.180.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.180.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.180.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.180.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.180.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.181.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.181.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.181.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.181.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.181.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.181.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.182.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.182.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.182.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.182.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.182.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.182.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.183.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.183.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.183.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.183.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.183.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.183.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.184.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.184.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.184.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.184.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.184.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.184.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.185.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.185.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.185.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.185.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.185.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.185.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.186.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.186.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.186.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.186.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.186.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.186.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.187.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.187.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.187.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.187.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.187.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.187.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.188.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.188.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.188.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.188.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.188.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.188.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.189.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.189.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.189.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.189.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.189.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.189.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.190.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.190.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.190.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.190.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.190.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.190.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.191.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.191.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.191.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.191.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.191.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.191.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.192.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.192.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.192.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.192.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.192.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.192.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.193.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.193.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.193.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.193.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.193.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.193.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.194.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.194.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.194.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.194.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.194.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.194.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.195.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.195.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.195.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.195.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.195.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.195.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.196.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.196.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.196.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.196.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.196.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.196.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.197.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.197.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.197.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.197.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.197.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.197.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.198.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.198.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.198.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.198.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.198.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.198.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.199.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.199.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.199.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.199.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.199.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.199.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.200.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.200.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.200.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.200.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.200.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.200.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.201.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.201.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.201.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.201.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.201.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.201.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.202.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.202.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.202.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.202.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.202.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.202.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.203.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.203.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.203.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.203.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.203.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.203.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.204.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.204.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.204.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.204.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.204.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.204.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.205.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.205.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.205.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.205.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.205.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.205.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.206.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.206.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.206.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.206.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.206.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.206.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.207.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.207.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.207.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.207.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.207.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.207.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.208.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.208.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.208.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.208.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.208.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.208.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.209.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.209.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.209.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.209.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.209.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.209.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.210.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.210.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.210.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.210.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.210.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.210.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.211.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.211.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.211.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.211.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.211.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.211.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.212.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.212.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.212.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.212.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.212.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.212.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.213.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.213.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.213.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.213.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.213.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.213.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.214.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.214.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.214.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.214.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.214.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.214.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.215.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.215.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.215.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.215.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.215.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.215.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.216.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.216.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.216.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.216.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.216.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.216.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.217.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.217.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.217.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.217.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.217.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.217.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.218.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.218.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.218.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.218.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.218.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.218.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.219.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.219.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.219.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.219.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.219.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.219.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.220.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.220.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.220.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.220.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.220.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.220.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.221.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.221.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.221.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.221.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.221.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.221.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.222.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.222.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.222.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.222.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.222.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.222.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.223.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.223.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.223.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.223.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.223.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.223.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.224.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.224.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.224.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.224.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.224.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.224.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.225.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.225.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.225.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.225.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.225.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.225.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.226.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.226.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.226.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.226.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.226.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.226.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.227.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.227.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.227.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.227.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.227.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.227.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.228.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.228.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.228.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.228.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.228.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.228.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.229.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.229.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.229.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.229.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.229.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.229.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.230.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.230.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.230.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.230.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.230.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.230.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.231.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.231.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.231.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.231.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.231.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.231.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.232.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.232.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.232.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.232.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.232.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.232.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.233.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.233.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.233.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.233.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.233.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.233.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.234.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.234.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.234.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.234.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.234.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.234.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.235.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.235.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.235.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.235.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.235.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.235.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.236.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.236.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.236.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.236.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.236.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.236.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.237.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.237.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.237.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.237.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.237.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.237.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.238.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.238.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.238.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.238.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.238.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.238.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.239.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.239.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.239.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.239.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.239.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.239.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.240.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.240.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.240.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.240.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.240.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.240.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.241.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.241.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.241.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.241.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.241.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.241.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.242.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.242.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.242.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.242.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.242.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.242.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.243.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.243.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.243.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.243.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.243.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.243.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.244.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.244.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.244.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.244.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.244.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.244.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.245.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.245.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.245.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.245.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.245.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.245.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.246.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.246.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.246.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.246.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.246.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.246.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.247.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.247.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.247.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.247.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.247.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.247.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.248.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.248.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.248.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.248.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.248.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.248.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.249.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.249.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.249.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.249.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.249.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.249.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.250.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.250.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.250.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.250.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.250.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.250.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.251.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.251.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.251.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.251.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.251.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.251.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.252.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.252.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.252.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.252.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.252.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.252.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.253.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.253.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.253.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.253.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.253.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.253.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.254.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.254.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.254.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.254.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.254.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.254.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.255.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.255.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.255.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.255.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.255.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.255.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.input_layernorm.weight": "model-00004-of-000163.safetensors", "model.layers.3.post_attention_layernorm.weight": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.q_a_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.self_attn.q_a_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.q_a_layernorm.weight": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.q_b_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.self_attn.q_b_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.kv_a_proj_with_mqa.weight": "model-00004-of-000163.safetensors", - "model.layers.4.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.kv_a_layernorm.weight": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.kv_b_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.self_attn.kv_b_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.o_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.self_attn.o_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.gate.weight": "model-00004-of-000163.safetensors", "model.layers.4.mlp.gate.e_score_correction_bias": "model-00004-of-000163.safetensors", "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.shared_experts.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.shared_experts.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.0.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.0.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.0.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.0.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.0.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.1.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.1.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.1.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.1.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.1.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.2.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.2.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.2.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.2.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.2.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.3.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.3.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.3.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.3.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.3.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.4.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.4.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.4.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.4.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.4.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.5.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.5.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.5.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.5.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.5.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.6.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.6.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.6.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.6.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.6.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.7.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.7.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.7.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.7.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.7.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.8.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.8.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.8.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.8.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.8.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.9.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.9.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.9.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.9.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.9.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.10.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.10.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.10.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.10.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.10.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.11.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.11.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.11.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.11.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.11.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.12.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.12.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.12.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.12.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.12.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.13.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.13.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.13.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.13.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.13.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.14.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.14.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.14.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.14.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.14.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.15.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.15.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.15.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.15.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.15.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.16.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.16.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.16.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.16.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.16.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.17.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.17.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.17.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.17.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.17.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.18.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.18.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.18.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.18.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.18.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.19.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.19.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.19.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.19.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.19.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.20.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.20.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.20.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.20.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.20.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.21.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.21.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.21.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.21.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.21.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.22.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.22.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.22.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.22.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.22.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.23.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.23.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.23.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.23.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.23.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.24.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.24.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.24.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.24.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.24.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.25.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.25.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.25.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.25.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.25.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.26.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.26.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.26.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.26.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.26.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.27.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.27.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.27.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.27.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.27.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.28.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.28.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.28.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.28.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.28.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.29.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.29.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.29.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.29.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.29.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.30.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.30.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.30.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.30.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.30.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.31.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.31.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.31.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.31.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.31.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.32.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.32.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.32.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.32.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.32.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.33.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.33.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.33.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.33.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.33.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.34.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.34.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.34.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.34.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.34.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.35.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.35.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.35.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.35.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.35.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.36.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.36.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.36.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.36.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.36.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.37.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.37.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.37.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.37.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.37.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.38.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.38.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.38.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.38.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.38.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.39.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.39.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.39.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.39.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.39.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.40.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.40.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.40.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.40.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.40.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.41.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.41.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.41.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.41.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.41.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.42.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.42.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.42.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.42.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.42.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.43.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.43.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.43.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.43.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.43.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.44.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.44.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.44.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.44.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.44.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.45.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.45.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.45.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.45.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.45.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.46.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.46.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.46.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.46.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.46.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.47.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.47.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.47.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.47.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.47.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.48.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.48.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.48.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.48.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.48.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.49.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.49.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.49.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.49.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.49.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.50.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.50.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.50.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.50.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.50.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.51.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.51.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.51.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.51.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.51.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.52.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.52.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.52.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.52.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.52.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.53.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.53.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.53.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.53.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.53.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.54.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.54.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.54.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.54.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.54.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.55.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.55.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.55.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.55.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.55.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.56.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.56.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.56.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.56.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.56.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.57.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.57.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.57.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.57.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.57.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.58.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.58.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.58.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.58.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.58.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.58.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.59.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.59.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.59.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.59.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.59.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.60.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.60.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.60.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.60.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.60.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.61.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.61.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.61.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.61.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.61.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.62.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.62.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.62.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.62.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.62.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.63.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.63.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.63.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.63.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.63.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.64.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.64.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.64.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.64.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.64.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.65.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.65.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.65.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.65.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.65.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.66.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.66.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.66.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.66.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.66.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.67.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.67.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.67.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.67.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.67.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.68.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.68.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.68.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.68.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.68.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.69.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.69.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.69.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.69.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.69.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.70.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.70.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.70.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.70.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.70.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.71.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.71.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.71.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.71.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.71.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.72.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.72.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.72.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.72.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.72.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.73.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.73.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.73.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.73.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.73.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.74.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.74.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.74.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.74.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.74.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.75.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.75.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.75.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.75.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.75.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.76.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.76.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.76.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.76.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.76.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.77.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.77.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.77.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.77.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.77.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.78.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.78.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.78.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.78.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.78.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.79.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.79.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.79.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.79.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.79.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.80.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.80.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.80.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.80.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.80.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.81.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.81.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.81.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.81.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.81.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.82.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.82.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.82.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.82.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.82.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.83.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.83.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.83.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.83.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.83.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.84.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.84.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.84.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.84.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.84.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.85.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.85.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.85.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.85.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.85.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.86.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.86.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.86.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.86.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.86.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.87.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.87.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.87.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.87.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.87.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.88.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.88.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.88.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.88.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.88.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.89.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.89.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.89.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.89.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.89.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.90.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.90.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.90.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.90.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.90.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.91.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.91.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.91.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.91.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.91.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.92.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.92.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.92.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.92.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.92.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.93.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.93.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.93.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.93.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.93.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.94.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.94.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.94.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.94.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.94.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.95.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.95.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.95.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.95.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.95.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.96.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.96.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.96.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.96.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.96.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.97.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.97.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.97.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.97.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.97.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.98.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.98.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.98.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.98.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.98.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.99.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.99.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.99.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.99.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.99.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.100.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.100.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.100.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.100.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.100.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.101.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.101.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.101.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.101.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.101.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.102.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.102.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.102.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.102.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.102.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.103.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.103.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.103.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.103.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.103.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.104.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.104.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.104.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.104.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.104.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.105.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.105.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.105.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.105.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.105.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.106.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.106.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.106.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.106.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.106.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.107.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.107.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.107.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.107.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.107.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.108.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.108.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.108.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.108.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.108.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.109.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.109.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.109.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.109.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.109.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.110.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.110.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.110.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.110.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.110.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.111.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.111.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.111.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.111.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.111.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.112.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.112.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.112.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.112.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.112.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.113.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.113.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.113.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.113.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.113.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.114.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.114.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.114.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.114.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.114.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.115.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.115.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.115.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.115.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.115.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.116.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.116.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.116.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.116.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.116.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.117.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.117.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.117.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.117.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.117.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.118.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.118.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.118.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.118.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.118.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.119.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.119.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.119.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.119.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.119.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.120.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.120.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.120.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.120.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.120.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.121.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.121.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.121.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.121.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.121.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.122.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.122.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.122.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.122.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.122.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.123.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.123.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.123.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.123.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.123.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.124.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.124.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.124.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.124.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.124.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.125.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.125.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.125.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.125.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.125.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.126.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.126.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.126.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.126.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.126.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.127.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.127.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.127.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.127.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.127.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.128.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.128.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.128.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.128.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.128.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.128.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.129.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.129.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.129.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.129.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.129.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.129.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.130.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.130.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.130.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.130.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.130.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.130.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.131.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.131.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.131.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.131.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.131.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.131.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.132.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.132.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.132.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.132.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.132.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.132.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.133.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.133.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.133.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.133.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.133.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.133.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.134.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.134.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.134.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.134.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.134.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.134.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.135.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.135.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.135.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.135.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.135.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.135.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.136.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.136.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.136.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.136.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.136.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.136.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.137.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.137.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.137.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.137.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.137.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.137.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.138.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.138.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.138.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.138.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.138.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.138.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.139.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.139.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.139.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.139.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.139.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.139.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.140.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.140.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.140.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.140.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.140.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.140.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.141.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.141.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.141.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.141.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.141.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.141.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.142.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.142.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.142.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.142.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.142.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.142.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.143.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.143.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.143.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.143.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.143.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.143.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.144.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.144.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.144.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.144.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.144.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.144.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.145.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.145.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.145.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.145.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.145.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.145.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.146.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.146.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.146.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.146.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.146.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.146.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.147.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.147.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.147.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.147.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.147.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.147.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.148.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.148.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.148.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.148.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.148.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.148.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.149.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.149.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.149.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.149.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.149.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.149.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.150.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.150.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.150.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.150.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.150.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.150.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.151.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.151.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.151.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.151.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.151.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.151.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.152.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.152.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.152.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.152.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.152.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.152.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.153.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.153.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.153.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.153.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.153.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.153.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.154.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.154.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.154.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.154.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.154.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.154.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.155.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.155.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.155.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.155.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.155.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.155.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.156.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.156.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.156.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.156.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.156.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.156.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.157.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.157.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.157.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.157.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.157.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.157.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.158.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.158.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.158.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.158.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.158.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.158.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.159.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.159.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.159.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.159.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.159.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.159.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.160.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.160.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.160.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.160.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.160.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.160.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.161.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.161.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.161.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.161.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.161.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.161.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.162.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.162.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.162.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.162.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.162.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.162.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.163.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.163.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.163.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.163.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.163.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.163.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.164.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.164.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.164.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.164.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.164.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.164.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.165.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.165.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.165.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.165.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.165.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.165.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.166.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.166.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.166.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.166.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.166.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.166.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.167.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.167.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.167.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.167.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.167.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.167.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.168.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.168.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.168.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.168.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.168.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.168.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.169.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.169.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.169.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.169.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.169.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.169.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.170.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.170.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.170.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.170.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.170.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.170.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.171.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.171.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.171.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.171.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.171.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.171.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.172.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.172.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.172.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.172.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.172.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.172.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.173.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.173.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.173.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.173.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.173.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.173.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.174.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.174.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.174.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.174.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.174.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.174.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.175.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.175.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.175.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.175.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.175.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.175.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.176.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.176.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.176.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.176.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.176.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.176.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.177.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.177.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.177.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.177.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.177.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.177.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.178.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.178.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.178.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.178.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.178.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.178.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.179.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.179.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.179.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.179.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.179.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.179.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.180.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.180.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.180.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.180.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.180.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.180.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.181.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.181.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.181.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.181.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.181.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.181.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.182.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.182.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.182.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.182.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.182.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.182.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.183.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.183.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.183.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.183.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.183.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.183.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.184.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.184.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.184.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.184.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.184.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.184.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.185.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.185.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.185.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.185.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.185.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.185.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.186.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.186.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.186.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.186.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.186.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.186.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.187.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.187.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.187.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.187.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.187.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.187.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.188.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.188.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.188.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.188.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.188.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.188.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.189.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.189.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.189.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.189.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.189.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.189.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.190.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.190.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.190.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.190.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.190.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.190.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.191.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.191.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.191.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.191.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.191.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.191.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.192.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.192.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.192.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.192.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.192.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.192.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.193.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.193.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.193.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.193.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.193.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.193.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.194.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.194.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.194.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.194.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.194.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.194.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.195.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.195.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.195.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.195.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.195.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.195.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.196.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.196.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.196.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.196.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.196.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.196.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.197.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.197.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.197.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.197.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.197.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.197.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.198.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.198.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.198.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.198.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.198.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.198.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.199.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.199.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.199.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.199.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.199.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.199.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.200.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.200.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.200.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.200.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.200.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.200.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.201.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.201.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.201.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.201.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.201.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.201.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.202.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.202.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.202.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.202.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.202.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.202.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.203.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.203.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.203.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.203.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.203.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.203.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.204.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.204.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.204.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.204.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.204.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.204.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.205.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.205.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.205.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.205.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.205.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.205.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.206.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.206.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.206.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.206.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.206.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.206.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.207.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.207.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.207.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.207.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.207.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.207.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.208.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.208.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.208.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.208.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.208.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.208.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.209.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.209.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.209.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.209.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.209.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.209.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.210.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.210.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.210.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.210.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.210.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.210.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.211.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.211.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.211.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.211.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.211.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.211.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.212.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.212.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.212.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.212.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.212.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.212.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.213.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.213.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.213.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.213.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.213.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.213.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.214.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.214.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.214.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.214.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.214.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.214.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.215.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.215.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.215.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.215.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.215.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.215.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.216.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.216.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.216.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.216.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.216.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.216.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.217.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.217.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.217.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.217.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.217.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.217.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.218.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.218.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.218.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.218.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.218.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.218.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.219.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.219.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.219.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.219.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.219.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.219.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.220.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.220.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.220.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.220.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.220.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.220.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.221.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.221.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.221.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.221.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.221.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.221.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.222.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.222.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.222.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.222.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.222.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.222.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.223.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.223.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.223.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.223.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.223.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.223.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.224.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.224.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.224.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.224.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.224.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.224.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.225.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.225.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.225.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.225.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.225.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.225.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.226.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.226.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.226.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.226.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.226.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.226.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.227.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.227.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.227.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.227.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.227.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.227.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.228.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.228.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.228.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.228.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.228.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.228.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.229.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.229.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.229.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.229.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.229.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.229.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.230.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.230.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.230.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.230.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.230.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.230.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.231.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.231.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.231.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.231.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.231.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.231.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.232.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.232.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.232.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.232.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.232.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.232.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.233.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.233.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.233.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.233.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.233.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.233.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.234.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.234.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.234.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.234.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.234.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.234.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.235.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.235.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.235.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.235.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.235.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.235.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.236.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.236.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.236.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.236.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.236.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.236.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.237.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.237.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.237.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.237.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.237.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.237.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.238.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.238.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.238.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.238.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.238.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.238.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.239.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.239.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.239.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.239.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.239.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.239.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.240.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.240.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.240.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.240.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.240.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.240.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.241.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.241.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.241.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.241.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.241.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.241.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.242.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.242.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.242.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.242.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.242.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.242.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.243.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.243.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.243.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.243.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.243.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.243.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.244.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.244.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.244.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.244.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.244.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.244.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.245.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.245.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.245.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.245.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.245.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.245.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.246.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.246.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.246.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.246.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.246.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.246.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.247.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.247.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.247.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.247.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.247.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.247.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.248.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.248.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.248.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.248.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.248.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.248.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.249.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.249.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.249.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.249.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.249.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.249.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.250.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.250.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.250.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.250.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.250.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.250.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.251.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.251.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.251.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.251.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.251.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.251.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.252.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.252.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.252.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.252.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.252.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.252.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.253.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.253.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.253.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.253.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.253.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.253.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.254.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.254.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.254.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.254.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.254.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.254.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.255.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.255.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.255.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.255.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.255.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.255.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.input_layernorm.weight": "model-00006-of-000163.safetensors", "model.layers.4.post_attention_layernorm.weight": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.q_a_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.5.self_attn.q_a_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.q_a_layernorm.weight": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.q_b_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.5.self_attn.q_b_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.kv_a_proj_with_mqa.weight": "model-00006-of-000163.safetensors", - "model.layers.5.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.kv_a_layernorm.weight": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.kv_b_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.5.self_attn.kv_b_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.o_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.5.self_attn.o_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.gate.weight": "model-00007-of-000163.safetensors", "model.layers.5.mlp.gate.e_score_correction_bias": "model-00007-of-000163.safetensors", "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.shared_experts.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.shared_experts.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.0.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.0.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.0.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.0.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.0.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.1.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.1.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.1.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.1.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.1.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.2.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.2.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.2.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.2.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.2.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.3.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.3.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.3.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.3.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.3.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.4.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.4.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.4.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.4.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.4.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.5.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.5.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.5.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.5.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.5.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.6.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.6.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.6.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.6.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.6.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.7.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.7.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.7.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.7.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.7.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.8.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.8.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.8.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.8.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.8.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.9.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.9.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.9.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.9.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.9.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.10.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.10.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.10.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.10.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.10.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.11.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.11.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.11.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.11.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.11.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.12.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.12.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.12.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.12.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.12.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.13.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.13.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.13.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.13.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.13.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.14.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.14.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.14.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.14.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.14.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.15.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.15.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.15.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.15.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.15.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.16.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.16.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.16.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.16.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.16.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.17.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.17.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.17.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.17.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.17.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.18.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.18.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.18.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.18.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.18.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.18.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.19.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.19.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.19.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.19.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.19.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.20.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.20.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.20.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.20.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.20.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.21.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.21.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.21.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.21.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.21.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.22.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.22.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.22.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.22.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.22.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.23.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.23.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.23.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.23.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.23.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.24.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.24.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.24.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.24.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.24.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.25.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.25.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.25.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.25.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.25.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.26.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.26.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.26.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.26.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.26.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.27.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.27.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.27.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.27.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.27.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.28.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.28.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.28.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.28.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.28.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.29.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.29.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.29.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.29.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.29.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.30.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.30.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.30.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.30.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.30.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.31.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.31.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.31.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.31.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.31.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.32.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.32.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.32.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.32.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.32.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.33.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.33.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.33.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.33.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.33.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.34.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.34.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.34.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.34.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.34.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.35.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.35.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.35.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.35.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.35.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.36.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.36.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.36.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.36.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.36.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.37.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.37.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.37.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.37.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.37.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.38.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.38.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.38.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.38.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.38.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.39.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.39.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.39.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.39.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.39.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.40.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.40.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.40.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.40.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.40.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.41.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.41.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.41.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.41.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.41.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.42.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.42.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.42.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.42.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.42.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.43.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.43.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.43.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.43.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.43.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.44.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.44.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.44.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.44.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.44.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.45.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.45.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.45.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.45.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.45.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.46.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.46.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.46.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.46.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.46.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.47.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.47.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.47.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.47.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.47.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.48.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.48.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.48.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.48.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.48.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.48.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.49.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.49.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.49.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.49.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.49.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.50.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.50.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.50.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.50.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.50.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.51.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.51.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.51.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.51.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.51.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.52.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.52.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.52.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.52.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.52.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.53.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.53.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.53.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.53.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.53.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.54.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.54.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.54.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.54.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.54.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.55.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.55.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.55.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.55.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.55.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.56.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.56.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.56.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.56.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.56.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.57.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.57.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.57.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.57.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.57.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.58.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.58.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.58.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.58.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.58.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.59.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.59.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.59.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.59.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.59.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.60.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.60.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.60.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.60.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.60.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.61.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.61.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.61.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.61.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.61.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.62.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.62.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.62.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.62.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.62.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.63.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.63.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.63.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.63.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.63.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.64.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.64.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.64.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.64.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.64.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.65.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.65.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.65.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.65.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.65.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.66.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.66.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.66.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.66.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.66.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.67.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.67.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.67.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.67.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.67.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.68.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.68.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.68.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.68.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.68.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.69.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.69.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.69.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.69.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.69.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.70.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.70.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.70.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.70.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.70.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.71.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.71.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.71.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.71.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.71.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.72.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.72.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.72.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.72.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.72.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.73.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.73.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.73.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.73.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.73.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.74.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.74.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.74.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.74.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.74.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.75.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.75.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.75.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.75.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.75.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.76.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.76.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.76.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.76.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.76.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.77.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.77.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.77.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.77.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.77.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.78.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.78.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.78.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.78.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.78.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.79.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.79.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.79.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.79.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.79.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.80.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.80.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.80.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.80.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.80.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.81.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.81.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.81.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.81.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.81.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.82.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.82.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.82.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.82.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.82.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.83.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.83.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.83.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.83.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.83.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.84.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.84.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.84.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.84.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.84.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.85.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.85.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.85.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.85.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.85.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.86.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.86.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.86.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.86.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.86.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.87.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.87.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.87.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.87.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.87.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.88.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.88.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.88.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.88.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.88.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.88.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.89.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.89.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.89.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.89.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.89.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.90.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.90.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.90.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.90.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.90.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.91.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.91.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.91.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.91.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.91.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.92.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.92.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.92.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.92.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.92.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.93.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.93.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.93.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.93.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.93.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.94.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.94.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.94.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.94.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.94.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.95.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.95.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.95.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.95.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.95.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.96.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.96.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.96.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.96.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.96.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.97.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.97.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.97.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.97.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.97.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.98.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.98.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.98.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.98.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.98.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.99.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.99.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.99.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.99.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.99.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.100.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.100.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.100.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.100.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.100.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.101.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.101.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.101.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.101.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.101.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.102.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.102.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.102.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.102.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.102.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.103.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.103.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.103.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.103.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.103.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.104.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.104.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.104.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.104.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.104.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.105.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.105.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.105.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.105.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.105.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.106.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.106.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.106.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.106.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.106.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.107.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.107.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.107.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.107.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.107.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.108.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.108.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.108.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.108.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.108.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.109.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.109.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.109.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.109.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.109.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.109.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.110.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.110.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.110.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.110.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.110.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.111.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.111.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.111.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.111.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.111.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.112.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.112.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.112.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.112.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.112.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.113.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.113.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.113.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.113.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.113.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.114.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.114.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.114.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.114.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.114.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.115.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.115.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.115.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.115.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.115.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.116.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.116.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.116.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.116.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.116.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.117.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.117.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.117.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.117.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.117.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.118.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.118.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.118.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.118.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.118.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.119.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.119.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.119.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.119.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.119.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.120.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.120.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.120.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.120.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.120.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.121.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.121.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.121.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.121.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.121.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.122.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.122.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.122.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.122.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.122.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.123.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.123.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.123.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.123.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.123.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.124.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.124.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.124.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.124.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.124.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.125.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.125.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.125.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.125.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.125.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.126.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.126.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.126.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.126.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.126.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.127.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.127.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.127.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.127.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.127.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.128.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.128.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.128.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.128.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.128.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.128.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.129.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.129.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.129.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.129.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.129.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.129.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.130.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.130.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.130.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.130.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.130.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.130.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.131.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.131.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.131.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.131.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.131.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.131.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.132.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.132.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.132.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.132.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.132.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.132.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.133.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.133.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.133.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.133.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.133.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.133.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.134.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.134.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.134.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.134.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.134.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.134.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.135.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.135.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.135.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.135.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.135.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.135.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.136.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.136.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.136.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.136.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.136.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.136.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.137.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.137.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.137.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.137.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.137.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.137.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.138.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.138.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.138.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.138.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.138.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.138.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.139.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.139.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.139.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.139.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.139.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.139.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.140.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.140.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.140.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.140.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.140.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.140.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.141.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.141.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.141.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.141.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.141.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.141.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.142.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.142.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.142.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.142.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.142.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.142.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.143.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.143.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.143.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.143.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.143.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.143.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.144.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.144.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.144.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.144.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.144.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.144.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.145.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.145.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.145.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.145.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.145.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.145.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.146.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.146.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.146.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.146.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.146.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.146.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.147.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.147.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.147.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.147.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.147.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.147.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.148.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.148.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.148.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.148.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.148.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.148.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.149.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.149.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.149.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.149.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.149.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.149.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.150.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.150.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.150.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.150.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.150.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.150.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.151.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.151.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.151.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.151.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.151.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.151.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.152.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.152.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.152.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.152.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.152.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.152.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.153.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.153.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.153.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.153.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.153.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.153.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.154.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.154.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.154.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.154.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.154.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.154.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.155.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.155.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.155.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.155.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.155.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.155.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.156.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.156.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.156.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.156.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.156.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.156.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.157.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.157.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.157.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.157.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.157.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.157.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.158.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.158.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.158.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.158.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.158.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.158.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.159.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.159.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.159.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.159.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.159.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.159.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.160.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.160.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.160.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.160.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.160.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.160.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.161.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.161.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.161.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.161.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.161.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.161.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.162.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.162.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.162.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.162.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.162.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.162.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.163.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.163.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.163.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.163.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.163.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.163.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.164.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.164.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.164.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.164.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.164.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.164.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.165.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.165.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.165.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.165.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.165.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.165.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.166.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.166.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.166.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.166.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.166.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.166.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.167.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.167.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.167.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.167.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.167.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.167.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.168.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.168.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.168.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.168.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.168.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.168.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.169.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.169.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.169.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.169.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.169.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.169.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.170.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.170.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.170.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.170.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.170.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.170.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.171.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.171.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.171.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.171.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.171.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.171.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.172.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.172.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.172.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.172.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.172.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.172.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.173.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.173.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.173.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.173.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.173.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.173.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.174.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.174.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.174.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.174.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.174.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.174.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.175.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.175.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.175.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.175.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.175.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.175.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.176.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.176.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.176.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.176.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.176.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.176.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.177.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.177.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.177.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.177.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.177.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.177.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.178.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.178.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.178.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.178.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.178.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.178.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.179.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.179.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.179.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.179.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.179.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.179.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.180.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.180.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.180.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.180.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.180.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.180.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.181.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.181.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.181.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.181.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.181.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.181.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.182.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.182.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.182.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.182.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.182.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.182.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.183.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.183.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.183.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.183.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.183.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.183.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.184.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.184.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.184.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.184.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.184.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.184.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.185.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.185.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.185.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.185.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.185.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.185.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.186.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.186.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.186.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.186.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.186.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.186.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.187.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.187.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.187.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.187.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.187.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.187.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.188.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.188.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.188.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.188.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.188.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.188.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.189.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.189.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.189.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.189.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.189.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.189.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.190.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.190.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.190.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.190.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.190.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.190.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.191.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.191.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.191.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.191.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.191.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.191.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.192.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.192.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.192.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.192.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.192.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.192.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.193.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.193.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.193.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.193.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.193.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.193.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.194.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.194.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.194.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.194.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.194.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.194.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.195.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.195.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.195.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.195.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.195.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.195.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.196.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.196.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.196.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.196.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.196.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.196.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.197.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.197.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.197.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.197.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.197.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.197.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.198.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.198.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.198.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.198.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.198.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.198.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.199.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.199.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.199.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.199.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.199.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.199.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.200.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.200.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.200.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.200.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.200.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.200.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.201.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.201.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.201.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.201.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.201.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.201.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.202.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.202.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.202.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.202.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.202.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.202.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.203.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.203.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.203.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.203.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.203.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.203.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.204.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.204.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.204.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.204.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.204.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.204.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.205.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.205.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.205.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.205.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.205.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.205.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.206.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.206.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.206.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.206.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.206.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.206.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.207.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.207.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.207.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.207.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.207.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.207.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.208.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.208.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.208.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.208.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.208.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.208.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.209.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.209.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.209.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.209.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.209.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.209.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.210.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.210.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.210.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.210.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.210.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.210.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.211.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.211.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.211.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.211.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.211.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.211.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.212.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.212.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.212.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.212.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.212.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.212.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.213.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.213.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.213.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.213.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.213.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.213.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.214.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.214.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.214.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.214.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.214.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.214.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.215.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.215.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.215.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.215.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.215.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.215.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.216.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.216.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.216.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.216.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.216.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.216.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.217.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.217.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.217.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.217.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.217.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.217.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.218.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.218.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.218.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.218.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.218.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.218.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.219.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.219.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.219.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.219.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.219.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.219.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.220.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.220.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.220.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.220.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.220.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.220.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.221.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.221.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.221.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.221.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.221.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.221.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.222.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.222.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.222.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.222.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.222.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.222.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.223.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.223.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.223.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.223.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.223.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.223.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.224.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.224.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.224.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.224.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.224.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.224.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.225.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.225.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.225.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.225.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.225.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.225.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.226.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.226.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.226.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.226.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.226.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.226.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.227.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.227.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.227.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.227.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.227.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.227.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.228.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.228.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.228.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.228.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.228.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.228.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.229.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.229.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.229.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.229.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.229.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.229.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.230.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.230.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.230.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.230.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.230.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.230.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.231.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.231.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.231.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.231.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.231.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.231.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.232.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.232.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.232.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.232.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.232.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.232.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.233.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.233.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.233.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.233.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.233.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.233.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.234.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.234.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.234.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.234.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.234.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.234.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.235.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.235.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.235.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.235.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.235.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.235.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.236.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.236.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.236.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.236.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.236.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.236.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.237.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.237.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.237.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.237.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.237.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.237.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.238.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.238.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.238.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.238.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.238.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.238.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.239.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.239.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.239.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.239.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.239.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.239.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.240.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.240.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.240.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.240.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.240.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.240.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.241.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.241.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.241.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.241.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.241.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.241.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.242.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.242.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.242.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.242.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.242.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.242.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.243.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.243.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.243.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.243.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.243.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.243.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.244.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.244.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.244.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.244.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.244.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.244.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.245.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.245.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.245.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.245.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.245.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.245.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.246.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.246.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.246.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.246.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.246.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.246.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.247.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.247.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.247.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.247.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.247.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.247.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.248.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.248.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.248.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.248.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.248.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.248.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.249.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.249.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.249.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.249.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.249.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.249.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.250.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.250.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.250.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.250.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.250.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.250.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.251.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.251.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.251.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.251.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.251.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.251.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.252.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.252.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.252.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.252.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.252.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.252.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.253.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.253.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.253.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.253.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.253.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.253.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.254.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.254.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.254.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.254.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.254.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.254.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.255.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.255.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.255.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.255.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.255.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.255.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.input_layernorm.weight": "model-00009-of-000163.safetensors", "model.layers.5.post_attention_layernorm.weight": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.q_a_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.self_attn.q_a_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.q_a_layernorm.weight": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.q_b_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.self_attn.q_b_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.kv_a_proj_with_mqa.weight": "model-00009-of-000163.safetensors", - "model.layers.6.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.kv_a_layernorm.weight": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.kv_b_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.self_attn.kv_b_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.o_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.self_attn.o_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.gate.weight": "model-00009-of-000163.safetensors", "model.layers.6.mlp.gate.e_score_correction_bias": "model-00009-of-000163.safetensors", "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.shared_experts.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.shared_experts.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.shared_experts.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.0.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.0.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.0.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.0.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.0.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.1.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.1.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.1.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.1.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.1.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.2.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.2.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.2.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.2.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.2.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.3.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.3.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.3.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.3.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.3.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.4.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.4.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.4.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.4.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.4.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.5.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.5.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.5.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.5.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.5.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.6.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.6.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.6.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.6.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.6.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.7.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.7.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.7.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.7.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.7.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.8.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.8.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.8.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.8.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.8.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.9.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.9.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.9.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.9.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.9.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.10.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.10.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.10.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.10.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.10.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.11.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.11.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.11.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.11.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.11.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.12.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.12.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.12.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.12.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.12.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.13.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.13.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.13.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.13.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.13.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.14.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.14.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.14.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.14.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.14.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.15.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.15.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.15.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.15.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.15.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.16.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.16.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.16.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.16.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.16.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.17.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.17.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.17.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.17.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.17.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.18.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.18.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.18.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.18.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.18.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.19.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.19.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.19.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.19.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.19.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.20.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.20.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.20.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.20.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.20.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.21.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.21.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.21.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.21.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.21.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.22.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.22.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.22.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.22.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.22.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.23.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.23.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.23.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.23.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.23.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.24.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.24.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.24.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.24.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.24.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.25.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.25.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.25.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.25.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.25.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.26.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.26.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.26.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.26.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.26.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.27.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.27.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.27.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.27.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.27.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.28.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.28.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.28.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.28.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.28.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.29.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.29.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.29.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.29.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.29.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.30.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.30.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.30.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.30.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.30.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.31.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.31.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.31.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.31.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.31.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.32.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.32.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.32.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.32.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.32.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.33.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.33.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.33.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.33.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.33.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.33.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.34.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.34.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.34.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.34.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.34.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.35.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.35.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.35.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.35.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.35.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.36.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.36.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.36.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.36.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.36.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.37.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.37.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.37.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.37.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.37.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.38.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.38.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.38.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.38.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.38.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.39.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.39.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.39.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.39.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.39.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.40.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.40.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.40.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.40.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.40.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.41.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.41.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.41.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.41.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.41.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.42.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.42.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.42.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.42.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.42.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.43.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.43.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.43.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.43.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.43.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.44.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.44.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.44.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.44.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.44.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.45.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.45.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.45.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.45.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.45.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.46.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.46.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.46.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.46.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.46.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.47.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.47.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.47.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.47.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.47.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.48.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.48.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.48.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.48.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.48.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.49.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.49.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.49.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.49.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.49.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.50.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.50.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.50.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.50.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.50.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.51.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.51.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.51.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.51.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.51.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.52.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.52.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.52.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.52.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.52.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.53.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.53.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.53.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.53.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.53.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.54.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.54.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.54.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.54.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.54.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.55.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.55.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.55.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.55.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.55.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.56.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.56.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.56.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.56.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.56.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.57.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.57.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.57.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.57.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.57.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.58.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.58.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.58.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.58.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.58.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.59.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.59.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.59.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.59.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.59.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.60.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.60.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.60.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.60.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.60.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.61.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.61.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.61.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.61.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.61.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.62.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.62.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.62.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.62.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.62.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.63.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.63.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.63.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.63.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.63.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.64.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.64.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.64.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.64.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.64.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.65.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.65.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.65.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.65.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.65.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.66.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.66.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.66.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.66.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.66.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.67.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.67.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.67.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.67.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.67.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.68.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.68.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.68.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.68.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.68.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.69.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.69.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.69.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.69.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.69.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.70.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.70.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.70.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.70.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.70.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.71.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.71.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.71.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.71.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.71.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.72.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.72.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.72.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.72.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.72.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.73.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.73.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.73.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.73.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.73.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.74.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.74.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.74.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.74.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.74.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.75.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.75.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.75.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.75.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.75.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.76.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.76.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.76.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.76.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.76.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.77.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.77.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.77.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.77.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.77.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.78.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.78.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.78.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.78.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.78.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.79.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.79.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.79.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.79.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.79.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.80.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.80.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.80.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.80.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.80.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.81.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.81.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.81.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.81.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.81.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.82.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.82.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.82.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.82.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.82.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.83.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.83.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.83.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.83.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.83.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.84.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.84.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.84.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.84.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.84.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.85.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.85.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.85.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.85.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.85.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.86.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.86.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.86.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.86.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.86.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.87.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.87.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.87.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.87.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.87.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.88.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.88.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.88.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.88.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.88.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.88.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.89.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.89.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.89.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.89.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.89.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.90.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.90.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.90.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.90.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.90.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.91.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.91.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.91.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.91.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.91.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.92.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.92.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.92.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.92.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.92.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.93.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.93.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.93.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.93.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.93.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.94.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.94.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.94.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.94.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.94.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.95.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.95.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.95.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.95.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.95.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.96.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.96.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.96.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.96.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.96.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.97.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.97.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.97.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.97.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.97.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.98.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.98.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.98.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.98.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.98.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.99.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.99.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.99.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.99.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.99.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.100.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.100.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.100.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.100.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.100.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.101.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.101.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.101.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.101.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.101.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.102.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.102.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.102.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.102.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.102.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.103.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.103.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.103.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.103.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.103.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.104.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.104.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.104.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.104.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.104.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.105.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.105.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.105.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.105.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.105.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.106.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.106.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.106.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.106.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.106.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.107.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.107.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.107.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.107.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.107.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.108.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.108.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.108.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.108.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.108.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.109.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.109.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.109.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.109.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.109.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.110.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.110.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.110.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.110.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.110.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.111.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.111.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.111.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.111.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.111.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.112.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.112.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.112.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.112.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.112.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.113.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.113.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.113.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.113.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.113.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.114.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.114.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.114.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.114.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.114.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.115.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.115.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.115.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.115.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.115.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.116.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.116.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.116.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.116.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.116.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.117.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.117.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.117.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.117.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.117.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.118.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.118.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.118.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.118.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.118.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.119.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.119.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.119.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.119.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.119.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.120.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.120.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.120.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.120.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.120.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.121.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.121.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.121.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.121.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.121.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.122.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.122.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.122.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.122.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.122.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.123.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.123.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.123.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.123.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.123.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.124.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.124.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.124.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.124.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.124.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.125.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.125.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.125.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.125.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.125.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.126.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.126.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.126.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.126.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.126.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.127.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.127.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.127.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.127.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.127.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.128.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.128.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.128.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.128.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.128.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.128.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.129.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.129.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.129.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.129.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.129.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.129.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.130.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.130.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.130.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.130.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.130.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.130.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.131.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.131.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.131.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.131.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.131.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.131.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.132.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.132.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.132.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.132.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.132.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.132.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.133.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.133.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.133.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.133.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.133.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.133.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.134.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.134.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.134.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.134.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.134.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.134.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.135.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.135.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.135.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.135.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.135.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.135.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.136.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.136.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.136.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.136.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.136.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.136.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.137.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.137.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.137.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.137.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.137.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.137.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.138.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.138.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.138.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.138.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.138.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.138.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.139.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.139.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.139.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.139.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.139.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.139.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.140.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.140.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.140.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.140.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.140.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.140.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.141.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.141.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.141.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.141.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.141.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.141.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.142.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.142.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.142.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.142.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.142.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.142.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.143.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.143.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.143.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.143.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.143.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.143.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.144.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.144.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.144.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.144.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.144.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.144.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.145.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.145.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.145.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.145.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.145.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.145.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.146.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.146.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.146.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.146.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.146.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.146.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.147.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.147.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.147.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.147.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.147.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.147.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.148.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.148.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.148.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.148.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.148.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.148.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.149.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.149.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.149.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.149.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.149.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.149.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.150.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.150.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.150.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.150.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.150.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.150.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.151.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.151.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.151.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.151.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.151.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.151.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.152.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.152.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.152.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.152.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.152.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.152.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.153.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.153.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.153.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.153.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.153.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.153.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.154.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.154.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.154.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.154.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.154.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.154.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.155.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.155.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.155.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.155.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.155.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.155.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.156.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.156.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.156.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.156.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.156.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.156.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.157.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.157.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.157.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.157.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.157.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.157.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.158.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.158.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.158.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.158.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.158.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.158.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.159.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.159.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.159.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.159.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.159.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.159.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.160.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.160.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.160.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.160.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.160.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.160.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.161.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.161.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.161.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.161.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.161.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.161.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.162.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.162.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.162.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.162.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.162.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.162.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.163.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.163.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.163.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.163.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.163.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.163.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.164.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.164.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.164.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.164.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.164.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.164.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.165.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.165.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.165.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.165.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.165.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.165.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.166.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.166.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.166.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.166.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.166.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.166.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.167.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.167.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.167.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.167.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.167.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.167.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.168.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.168.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.168.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.168.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.168.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.168.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.169.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.169.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.169.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.169.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.169.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.169.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.170.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.170.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.170.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.170.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.170.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.170.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.171.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.171.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.171.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.171.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.171.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.171.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.172.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.172.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.172.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.172.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.172.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.172.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.173.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.173.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.173.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.173.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.173.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.173.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.174.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.174.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.174.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.174.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.174.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.174.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.175.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.175.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.175.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.175.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.175.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.175.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.176.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.176.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.176.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.176.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.176.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.176.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.177.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.177.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.177.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.177.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.177.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.177.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.178.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.178.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.178.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.178.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.178.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.178.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.179.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.179.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.179.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.179.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.179.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.179.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.180.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.180.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.180.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.180.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.180.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.180.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.181.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.181.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.181.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.181.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.181.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.181.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.182.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.182.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.182.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.182.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.182.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.182.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.183.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.183.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.183.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.183.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.183.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.183.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.184.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.184.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.184.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.184.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.184.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.184.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.185.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.185.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.185.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.185.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.185.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.185.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.186.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.186.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.186.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.186.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.186.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.186.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.187.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.187.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.187.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.187.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.187.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.187.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.188.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.188.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.188.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.188.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.188.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.188.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.189.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.189.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.189.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.189.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.189.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.189.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.190.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.190.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.190.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.190.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.190.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.190.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.191.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.191.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.191.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.191.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.191.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.191.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.192.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.192.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.192.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.192.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.192.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.192.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.193.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.193.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.193.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.193.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.193.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.193.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.194.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.194.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.194.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.194.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.194.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.194.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.195.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.195.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.195.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.195.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.195.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.195.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.196.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.196.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.196.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.196.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.196.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.196.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.197.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.197.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.197.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.197.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.197.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.197.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.198.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.198.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.198.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.198.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.198.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.198.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.199.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.199.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.199.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.199.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.199.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.199.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.200.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.200.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.200.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.200.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.200.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.200.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.201.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.201.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.201.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.201.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.201.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.201.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.202.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.202.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.202.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.202.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.202.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.202.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.203.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.203.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.203.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.203.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.203.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.203.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.204.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.204.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.204.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.204.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.204.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.204.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.205.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.205.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.205.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.205.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.205.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.205.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.206.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.206.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.206.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.206.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.206.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.206.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.207.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.207.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.207.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.207.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.207.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.207.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.208.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.208.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.208.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.208.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.208.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.208.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.209.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.209.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.209.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.209.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.209.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.209.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.210.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.210.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.210.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.210.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.210.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.210.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.211.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.211.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.211.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.211.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.211.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.211.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.212.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.212.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.212.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.212.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.212.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.212.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.213.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.213.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.213.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.213.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.213.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.213.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.214.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.214.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.214.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.214.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.214.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.214.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.215.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.215.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.215.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.215.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.215.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.215.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.216.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.216.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.216.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.216.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.216.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.216.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.217.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.217.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.217.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.217.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.217.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.217.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.218.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.218.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.218.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.218.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.218.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.218.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.219.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.219.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.219.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.219.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.219.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.219.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.220.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.220.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.220.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.220.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.220.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.220.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.221.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.221.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.221.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.221.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.221.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.221.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.222.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.222.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.222.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.222.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.222.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.222.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.223.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.223.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.223.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.223.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.223.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.223.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.224.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.224.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.224.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.224.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.224.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.224.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.225.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.225.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.225.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.225.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.225.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.225.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.226.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.226.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.226.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.226.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.226.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.226.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.227.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.227.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.227.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.227.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.227.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.227.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.228.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.228.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.228.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.228.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.228.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.228.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.229.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.229.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.229.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.229.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.229.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.229.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.230.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.230.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.230.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.230.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.230.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.230.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.231.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.231.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.231.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.231.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.231.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.231.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.232.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.232.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.232.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.232.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.232.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.232.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.233.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.233.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.233.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.233.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.233.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.233.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.234.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.234.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.234.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.234.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.234.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.234.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.235.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.235.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.235.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.235.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.235.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.235.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.236.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.236.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.236.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.236.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.236.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.236.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.237.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.237.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.237.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.237.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.237.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.237.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.238.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.238.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.238.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.238.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.238.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.238.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.239.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.239.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.239.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.239.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.239.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.239.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.240.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.240.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.240.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.240.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.240.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.240.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.241.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.241.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.241.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.241.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.241.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.241.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.242.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.242.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.242.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.242.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.242.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.242.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.243.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.243.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.243.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.243.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.243.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.243.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.244.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.244.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.244.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.244.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.244.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.244.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.245.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.245.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.245.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.245.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.245.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.245.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.246.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.246.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.246.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.246.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.246.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.246.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.247.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.247.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.247.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.247.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.247.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.247.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.248.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.248.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.248.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.248.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.248.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.248.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.249.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.249.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.249.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.249.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.249.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.249.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.250.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.250.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.250.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.250.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.250.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.250.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.251.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.251.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.251.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.251.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.251.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.251.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.252.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.252.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.252.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.252.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.252.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.252.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.253.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.253.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.253.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.253.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.253.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.253.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.254.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.254.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.254.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.254.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.254.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.254.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.255.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.255.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.255.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.255.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.255.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.255.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.input_layernorm.weight": "model-00012-of-000163.safetensors", "model.layers.6.post_attention_layernorm.weight": "model-00012-of-000163.safetensors", "model.layers.7.self_attn.q_a_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.self_attn.q_a_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.self_attn.q_a_layernorm.weight": "model-00013-of-000163.safetensors", "model.layers.7.self_attn.q_b_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.self_attn.q_b_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.self_attn.kv_a_proj_with_mqa.weight": "model-00013-of-000163.safetensors", - "model.layers.7.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.self_attn.kv_a_layernorm.weight": "model-00013-of-000163.safetensors", "model.layers.7.self_attn.kv_b_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.self_attn.kv_b_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.self_attn.o_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.self_attn.o_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.gate.weight": "model-00013-of-000163.safetensors", "model.layers.7.mlp.gate.e_score_correction_bias": "model-00013-of-000163.safetensors", "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.shared_experts.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.shared_experts.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.shared_experts.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.0.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.0.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.0.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.0.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.0.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.1.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.1.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.1.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.1.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.1.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.2.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.2.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.2.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.2.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.2.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.3.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.3.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.3.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.3.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.3.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.4.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.4.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.4.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.4.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.4.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.5.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.5.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.5.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.5.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.5.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.6.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.6.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.6.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.6.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.6.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.7.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.7.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.7.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.7.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.7.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.8.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.8.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.8.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.8.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.8.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.9.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.9.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.9.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.9.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.9.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.10.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.10.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.10.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.10.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.10.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.11.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.11.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.11.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.11.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.11.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.12.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.12.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.12.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.12.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.12.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.13.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.13.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.13.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.13.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.13.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.14.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.14.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.14.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.14.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.14.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.15.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.15.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.15.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.15.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.15.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.16.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.16.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.16.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.16.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.16.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.17.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.17.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.17.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.17.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.17.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.18.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.18.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.18.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.18.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.18.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.19.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.19.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.19.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.19.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.19.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.20.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.20.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.20.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.20.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.20.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.21.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.21.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.21.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.21.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.21.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.22.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.22.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.22.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.22.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.22.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.23.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.23.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.23.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.23.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.23.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.24.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.24.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.24.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.24.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.24.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.25.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.25.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.25.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.25.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.25.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.26.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.26.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.26.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.26.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.26.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.27.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.27.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.27.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.27.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.27.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.28.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.28.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.28.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.28.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.28.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.29.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.29.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.29.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.29.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.29.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.30.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.30.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.30.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.30.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.30.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.31.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.31.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.31.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.31.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.31.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.32.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.32.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.32.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.32.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.32.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.33.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.33.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.33.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.33.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.33.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.34.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.34.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.34.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.34.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.34.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.35.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.35.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.35.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.35.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.35.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.36.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.36.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.36.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.36.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.36.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.37.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.37.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.37.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.37.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.37.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.38.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.38.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.38.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.38.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.38.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.39.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.39.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.39.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.39.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.39.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.40.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.40.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.40.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.40.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.40.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.41.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.41.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.41.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.41.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.41.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.42.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.42.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.42.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.42.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.42.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.43.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.43.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.43.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.43.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.43.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.44.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.44.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.44.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.44.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.44.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.45.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.45.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.45.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.45.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.45.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.46.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.46.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.46.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.46.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.46.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.47.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.47.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.47.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.47.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.47.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.48.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.48.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.48.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.48.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.48.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.49.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.49.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.49.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.49.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.49.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.50.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.50.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.50.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.50.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.50.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.51.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.51.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.51.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.51.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.51.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.52.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.52.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.52.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.52.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.52.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.53.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.53.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.53.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.53.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.53.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.54.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.54.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.54.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.54.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.54.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.55.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.55.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.55.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.55.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.55.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.56.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.56.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.56.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.56.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.56.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.57.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.57.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.57.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.57.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.57.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.58.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.58.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.58.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.58.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.58.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.59.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.59.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.59.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.59.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.59.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.60.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.60.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.60.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.60.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.60.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.61.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.61.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.61.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.61.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.61.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.62.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.62.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.62.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.62.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.62.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.63.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.63.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.63.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.63.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.63.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.64.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.64.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.64.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.64.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.64.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.65.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.65.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.65.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.65.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.65.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.66.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.66.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.66.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.66.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.66.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.67.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.67.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.67.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.67.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.67.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.68.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.68.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.68.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.68.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.68.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.69.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.69.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.69.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.69.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.69.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.70.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.70.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.70.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.70.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.70.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.71.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.71.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.71.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.71.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.71.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.72.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.72.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.72.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.72.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.72.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.73.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.73.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.73.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.73.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.73.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.74.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.74.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.74.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.74.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.74.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.75.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.75.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.75.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.75.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.75.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.76.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.76.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.76.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.76.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.76.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.77.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.77.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.77.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.77.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.77.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.78.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.78.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.78.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.78.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.78.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.79.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.79.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.79.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.79.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.79.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.80.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.80.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.80.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.80.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.80.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.81.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.81.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.81.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.81.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.81.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.82.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.82.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.82.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.82.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.82.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.83.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.83.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.83.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.83.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.83.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.84.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.84.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.84.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.84.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.84.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.85.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.85.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.85.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.85.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.85.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.86.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.86.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.86.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.86.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.86.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.87.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.87.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.87.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.87.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.87.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.88.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.88.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.88.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.88.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.88.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.89.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.89.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.89.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.89.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.89.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.90.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.90.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.90.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.90.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.90.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.91.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.91.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.91.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.91.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.91.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.92.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.92.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.92.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.92.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.92.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.93.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.93.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.93.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.93.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.93.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.94.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.94.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.94.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.94.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.94.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.95.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.95.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.95.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.95.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.95.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.96.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.96.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.96.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.96.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.96.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.97.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.97.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.97.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.97.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.97.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.98.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.98.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.98.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.98.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.98.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.99.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.99.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.99.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.99.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.99.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.100.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.100.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.100.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.100.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.100.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.101.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.101.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.101.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.101.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.101.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.102.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.102.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.102.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.102.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.102.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.103.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.103.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.103.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.103.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.103.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.104.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.104.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.104.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.104.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.104.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.105.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.105.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.105.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.105.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.105.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.106.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.106.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.106.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.106.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.106.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.107.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.107.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.107.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.107.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.107.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.108.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.108.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.108.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.108.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.108.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.109.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.109.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.109.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.109.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.109.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.110.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.110.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.110.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.110.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.110.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.111.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.111.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.111.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.111.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.111.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.112.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.112.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.112.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.112.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.112.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.113.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.113.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.113.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.113.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.113.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.114.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.114.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.114.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.114.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.114.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.115.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.115.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.115.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.115.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.115.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.116.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.116.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.116.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.116.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.116.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.117.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.117.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.117.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.117.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.117.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.118.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.118.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.118.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.118.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.118.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.119.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.119.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.119.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.119.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.119.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.120.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.120.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.120.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.120.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.120.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.121.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.121.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.121.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.121.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.121.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.122.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.122.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.122.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.122.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.122.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.123.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.123.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.123.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.123.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.123.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.124.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.124.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.124.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.124.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.124.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.125.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.125.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.125.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.125.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.125.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.126.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.126.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.126.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.126.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.126.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.127.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.127.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.127.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.127.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.127.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.128.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.128.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.128.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.128.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.128.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.128.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.129.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.129.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.129.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.129.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.129.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.129.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.130.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.130.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.130.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.130.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.130.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.130.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.131.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.131.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.131.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.131.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.131.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.131.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.132.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.132.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.132.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.132.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.132.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.132.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.133.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.133.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.133.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.133.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.133.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.133.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.134.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.134.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.134.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.134.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.134.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.134.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.135.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.135.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.135.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.135.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.135.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.135.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.136.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.136.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.136.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.136.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.136.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.136.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.137.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.137.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.137.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.137.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.137.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.137.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.138.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.138.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.138.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.138.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.138.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.138.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.139.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.139.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.139.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.139.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.139.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.139.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.140.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.140.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.140.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.140.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.140.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.140.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.141.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.141.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.141.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.141.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.141.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.141.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.142.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.142.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.142.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.142.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.142.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.142.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.143.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.143.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.143.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.143.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.143.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.143.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.144.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.144.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.144.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.144.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.144.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.144.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.145.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.145.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.145.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.145.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.145.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.145.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.146.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.146.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.146.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.146.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.146.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.146.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.147.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.147.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.147.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.147.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.147.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.147.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.148.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.148.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.148.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.148.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.148.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.148.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.149.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.149.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.149.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.149.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.149.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.149.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.150.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.150.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.150.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.150.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.150.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.150.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.151.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.151.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.151.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.151.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.151.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.151.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.152.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.152.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.152.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.152.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.152.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.152.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.153.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.153.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.153.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.153.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.153.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.153.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.154.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.154.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.154.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.154.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.154.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.154.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.155.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.155.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.155.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.155.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.155.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.155.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.156.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.156.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.156.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.156.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.156.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.156.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.157.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.157.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.157.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.157.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.157.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.157.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.158.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.158.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.158.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.158.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.158.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.158.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.159.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.159.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.159.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.159.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.159.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.159.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.160.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.160.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.160.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.160.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.160.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.160.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.161.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.161.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.161.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.161.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.161.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.161.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.162.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.162.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.162.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.162.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.162.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.162.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.163.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.163.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.163.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.163.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.163.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.163.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.164.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.164.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.164.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.164.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.164.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.164.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.165.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.165.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.165.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.165.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.165.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.165.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.166.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.166.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.166.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.166.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.166.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.166.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.167.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.167.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.167.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.167.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.167.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.167.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.168.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.168.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.168.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.168.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.168.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.168.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.169.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.169.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.169.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.169.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.169.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.169.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.170.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.170.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.170.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.170.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.170.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.170.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.171.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.171.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.171.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.171.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.171.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.171.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.172.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.172.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.172.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.172.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.172.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.172.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.173.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.173.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.173.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.173.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.173.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.173.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.174.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.174.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.174.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.174.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.174.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.174.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.175.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.175.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.175.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.175.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.175.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.175.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.176.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.176.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.176.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.176.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.176.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.176.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.177.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.177.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.177.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.177.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.177.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.177.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.178.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.178.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.178.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.178.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.178.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.178.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.179.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.179.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.179.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.179.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.179.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.179.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.180.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.180.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.180.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.180.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.180.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.180.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.181.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.181.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.181.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.181.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.181.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.181.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.182.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.182.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.182.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.182.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.182.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.182.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.183.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.183.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.183.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.183.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.183.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.183.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.184.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.184.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.184.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.184.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.184.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.184.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.185.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.185.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.185.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.185.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.185.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.185.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.186.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.186.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.186.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.186.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.186.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.186.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.187.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.187.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.187.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.187.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.187.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.187.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.188.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.188.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.188.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.188.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.188.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.188.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.189.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.189.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.189.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.189.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.189.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.189.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.190.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.190.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.190.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.190.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.190.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.190.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.191.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.191.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.191.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.191.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.191.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.191.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.192.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.192.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.192.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.192.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.192.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.192.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.193.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.193.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.193.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.193.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.193.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.193.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.194.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.194.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.194.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.194.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.194.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.194.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.195.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.195.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.195.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.195.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.195.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.195.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.196.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.196.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.196.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.196.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.196.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.196.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.197.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.197.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.197.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.197.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.197.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.197.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.198.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.198.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.198.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.198.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.198.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.198.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.199.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.199.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.199.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.199.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.199.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.199.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.200.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.200.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.200.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.200.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.200.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.200.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.201.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.201.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.201.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.201.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.201.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.201.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.202.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.202.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.202.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.202.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.202.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.202.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.203.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.203.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.203.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.203.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.203.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.203.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.204.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.204.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.204.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.204.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.204.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.204.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.205.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.205.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.205.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.205.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.205.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.205.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.206.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.206.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.206.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.206.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.206.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.206.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.207.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.207.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.207.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.207.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.207.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.207.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.208.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.208.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.208.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.208.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.208.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.208.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.209.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.209.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.209.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.209.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.209.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.209.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.210.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.210.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.210.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.210.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.210.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.210.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.211.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.211.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.211.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.211.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.211.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.211.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.212.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.212.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.212.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.212.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.212.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.212.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.213.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.213.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.213.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.213.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.213.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.213.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.214.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.214.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.214.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.214.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.214.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.214.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.215.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.215.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.215.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.215.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.215.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.215.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.216.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.216.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.216.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.216.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.216.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.216.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.217.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.217.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.217.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.217.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.217.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.217.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.218.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.218.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.218.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.218.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.218.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.218.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.219.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.219.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.219.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.219.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.219.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.219.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.220.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.220.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.220.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.220.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.220.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.220.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.221.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.221.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.221.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.221.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.221.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.221.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.222.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.222.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.222.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.222.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.222.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.222.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.223.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.223.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.223.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.223.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.223.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.223.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.224.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.224.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.224.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.224.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.224.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.224.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.225.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.225.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.225.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.225.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.225.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.225.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.226.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.226.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.226.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.226.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.226.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.226.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.227.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.227.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.227.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.227.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.227.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.227.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.228.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.228.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.228.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.228.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.228.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.228.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.229.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.229.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.229.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.229.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.229.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.229.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.230.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.230.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.230.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.230.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.230.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.230.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.231.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.231.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.231.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.231.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.231.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.231.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.232.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.232.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.232.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.232.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.232.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.232.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.233.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.233.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.233.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.233.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.233.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.233.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.234.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.234.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.234.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.234.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.234.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.234.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.235.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.235.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.235.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.235.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.235.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.235.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.236.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.236.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.236.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.236.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.236.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.236.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.237.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.237.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.237.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.237.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.237.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.237.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.238.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.238.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.238.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.238.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.238.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.238.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.239.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.239.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.239.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.239.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.239.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.239.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.240.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.240.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.240.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.240.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.240.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.240.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.241.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.241.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.241.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.241.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.241.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.241.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.242.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.242.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.242.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.242.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.242.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.242.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.243.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.243.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.243.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.243.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.243.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.243.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.244.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.244.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.244.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.244.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.244.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.244.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.245.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.245.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.245.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.245.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.245.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.245.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.246.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.246.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.246.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.246.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.246.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.246.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.247.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.247.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.247.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.247.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.247.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.247.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.248.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.248.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.248.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.248.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.248.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.248.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.249.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.249.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.249.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.249.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.249.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.249.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.250.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.250.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.250.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.250.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.250.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.250.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.251.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.251.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.251.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.251.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.251.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.251.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.252.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.252.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.252.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.252.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.252.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.252.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.253.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.253.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.253.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.253.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.253.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.253.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.254.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.254.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.254.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.254.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.254.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.254.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.255.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.255.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.255.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.255.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.255.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.255.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.input_layernorm.weight": "model-00015-of-000163.safetensors", "model.layers.7.post_attention_layernorm.weight": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.q_a_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.self_attn.q_a_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.q_a_layernorm.weight": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.q_b_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.self_attn.q_b_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.kv_a_proj_with_mqa.weight": "model-00015-of-000163.safetensors", - "model.layers.8.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.kv_a_layernorm.weight": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.kv_b_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.self_attn.kv_b_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.o_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.self_attn.o_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.gate.weight": "model-00015-of-000163.safetensors", "model.layers.8.mlp.gate.e_score_correction_bias": "model-00015-of-000163.safetensors", "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.shared_experts.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.shared_experts.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.shared_experts.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.0.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.0.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.0.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.0.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.0.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.1.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.1.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.1.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.1.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.1.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.2.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.2.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.2.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.2.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.2.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.3.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.3.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.3.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.3.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.3.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.4.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.4.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.4.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.4.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.4.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.5.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.5.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.5.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.5.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.5.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.6.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.6.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.6.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.6.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.6.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.7.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.7.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.7.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.7.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.7.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.8.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.8.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.8.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.8.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.8.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.9.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.9.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.9.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.9.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.9.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.10.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.10.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.10.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.10.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.10.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.11.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.11.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.11.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.11.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.11.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.12.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.12.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.12.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.12.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.12.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.13.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.13.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.13.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.13.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.13.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.14.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.14.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.14.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.14.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.14.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.15.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.15.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.15.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.15.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.15.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.16.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.16.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.16.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.16.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.16.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.17.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.17.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.17.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.17.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.17.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.18.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.18.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.18.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.18.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.18.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.19.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.19.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.19.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.19.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.19.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.20.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.20.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.20.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.20.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.20.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.21.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.21.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.21.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.21.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.21.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.22.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.22.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.22.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.22.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.22.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.23.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.23.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.23.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.23.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.23.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.24.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.24.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.24.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.24.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.24.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.25.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.25.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.25.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.25.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.25.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.26.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.26.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.26.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.26.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.26.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.27.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.27.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.27.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.27.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.27.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.28.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.28.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.28.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.28.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.28.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.29.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.29.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.29.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.29.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.29.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.30.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.30.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.30.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.30.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.30.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.31.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.31.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.31.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.31.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.31.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.32.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.32.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.32.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.32.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.32.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.33.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.33.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.33.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.33.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.33.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.34.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.34.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.34.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.34.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.34.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.35.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.35.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.35.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.35.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.35.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.36.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.36.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.36.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.36.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.36.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.37.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.37.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.37.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.37.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.37.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.38.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.38.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.38.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.38.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.38.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.39.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.39.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.39.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.39.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.39.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.40.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.40.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.40.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.40.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.40.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.41.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.41.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.41.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.41.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.41.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.42.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.42.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.42.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.42.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.42.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.43.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.43.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.43.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.43.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.43.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.44.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.44.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.44.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.44.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.44.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.45.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.45.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.45.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.45.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.45.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.46.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.46.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.46.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.46.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.46.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.47.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.47.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.47.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.47.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.47.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.48.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.48.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.48.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.48.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.48.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.49.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.49.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.49.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.49.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.49.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.50.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.50.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.50.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.50.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.50.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.51.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.51.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.51.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.51.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.51.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.52.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.52.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.52.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.52.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.52.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.53.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.53.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.53.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.53.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.53.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.54.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.54.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.54.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.54.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.54.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.55.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.55.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.55.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.55.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.55.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.56.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.56.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.56.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.56.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.56.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.57.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.57.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.57.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.57.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.57.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.58.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.58.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.58.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.58.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.58.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.59.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.59.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.59.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.59.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.59.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.60.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.60.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.60.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.60.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.60.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.61.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.61.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.61.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.61.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.61.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.62.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.62.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.62.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.62.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.62.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.63.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.63.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.63.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.63.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.63.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.64.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.64.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.64.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.64.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.64.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.65.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.65.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.65.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.65.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.65.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.66.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.66.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.66.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.66.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.66.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.67.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.67.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.67.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.67.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.67.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.68.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.68.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.68.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.68.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.68.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.68.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.69.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.69.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.69.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.69.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.69.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.70.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.70.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.70.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.70.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.70.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.71.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.71.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.71.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.71.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.71.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.72.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.72.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.72.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.72.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.72.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.73.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.73.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.73.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.73.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.73.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.74.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.74.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.74.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.74.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.74.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.75.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.75.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.75.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.75.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.75.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.76.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.76.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.76.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.76.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.76.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.77.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.77.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.77.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.77.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.77.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.78.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.78.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.78.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.78.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.78.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.79.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.79.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.79.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.79.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.79.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.80.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.80.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.80.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.80.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.80.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.81.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.81.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.81.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.81.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.81.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.82.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.82.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.82.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.82.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.82.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.83.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.83.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.83.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.83.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.83.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.84.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.84.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.84.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.84.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.84.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.85.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.85.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.85.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.85.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.85.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.86.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.86.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.86.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.86.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.86.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.87.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.87.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.87.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.87.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.87.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.88.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.88.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.88.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.88.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.88.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.89.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.89.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.89.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.89.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.89.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.90.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.90.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.90.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.90.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.90.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.91.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.91.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.91.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.91.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.91.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.92.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.92.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.92.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.92.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.92.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.93.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.93.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.93.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.93.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.93.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.94.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.94.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.94.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.94.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.94.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.95.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.95.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.95.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.95.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.95.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.96.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.96.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.96.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.96.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.96.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.97.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.97.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.97.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.97.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.97.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.98.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.98.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.98.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.98.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.98.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.99.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.99.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.99.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.99.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.99.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.100.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.100.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.100.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.100.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.100.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.101.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.101.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.101.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.101.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.101.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.102.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.102.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.102.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.102.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.102.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.103.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.103.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.103.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.103.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.103.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.104.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.104.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.104.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.104.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.104.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.105.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.105.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.105.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.105.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.105.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.106.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.106.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.106.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.106.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.106.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.107.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.107.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.107.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.107.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.107.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.108.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.108.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.108.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.108.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.108.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.109.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.109.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.109.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.109.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.109.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.110.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.110.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.110.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.110.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.110.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.111.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.111.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.111.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.111.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.111.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.112.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.112.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.112.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.112.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.112.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.113.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.113.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.113.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.113.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.113.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.114.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.114.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.114.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.114.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.114.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.115.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.115.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.115.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.115.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.115.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.116.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.116.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.116.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.116.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.116.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.117.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.117.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.117.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.117.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.117.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.118.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.118.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.118.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.118.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.118.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.119.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.119.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.119.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.119.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.119.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.120.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.120.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.120.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.120.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.120.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.121.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.121.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.121.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.121.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.121.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.122.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.122.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.122.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.122.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.122.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.123.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.123.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.123.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.123.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.123.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.124.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.124.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.124.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.124.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.124.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.125.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.125.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.125.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.125.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.125.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.126.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.126.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.126.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.126.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.126.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.127.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.127.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.127.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.127.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.127.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.128.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.128.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.128.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.128.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.128.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.128.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.129.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.129.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.129.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.129.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.129.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.129.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.130.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.130.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.130.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.130.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.130.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.130.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.131.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.131.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.131.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.131.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.131.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.131.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.132.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.132.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.132.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.132.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.132.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.132.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.133.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.133.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.133.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.133.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.133.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.133.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.134.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.134.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.134.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.134.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.134.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.134.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.135.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.135.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.135.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.135.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.135.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.135.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.136.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.136.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.136.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.136.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.136.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.136.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.137.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.137.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.137.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.137.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.137.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.137.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.138.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.138.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.138.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.138.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.138.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.138.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.139.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.139.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.139.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.139.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.139.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.139.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.140.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.140.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.140.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.140.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.140.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.140.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.141.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.141.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.141.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.141.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.141.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.141.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.142.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.142.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.142.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.142.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.142.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.142.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.143.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.143.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.143.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.143.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.143.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.143.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.144.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.144.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.144.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.144.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.144.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.144.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.145.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.145.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.145.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.145.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.145.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.145.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.146.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.146.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.146.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.146.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.146.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.146.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.147.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.147.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.147.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.147.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.147.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.147.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.148.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.148.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.148.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.148.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.148.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.148.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.149.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.149.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.149.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.149.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.149.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.149.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.150.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.150.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.150.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.150.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.150.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.150.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.151.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.151.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.151.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.151.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.151.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.151.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.152.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.152.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.152.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.152.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.152.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.152.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.153.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.153.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.153.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.153.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.153.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.153.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.154.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.154.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.154.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.154.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.154.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.154.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.155.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.155.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.155.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.155.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.155.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.155.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.156.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.156.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.156.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.156.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.156.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.156.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.157.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.157.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.157.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.157.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.157.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.157.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.158.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.158.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.158.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.158.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.158.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.158.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.159.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.159.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.159.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.159.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.159.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.159.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.160.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.160.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.160.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.160.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.160.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.160.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.161.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.161.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.161.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.161.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.161.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.161.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.162.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.162.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.162.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.162.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.162.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.162.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.163.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.163.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.163.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.163.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.163.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.163.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.164.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.164.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.164.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.164.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.164.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.164.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.165.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.165.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.165.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.165.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.165.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.165.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.166.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.166.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.166.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.166.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.166.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.166.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.167.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.167.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.167.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.167.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.167.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.167.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.168.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.168.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.168.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.168.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.168.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.168.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.169.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.169.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.169.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.169.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.169.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.169.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.170.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.170.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.170.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.170.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.170.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.170.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.171.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.171.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.171.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.171.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.171.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.171.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.172.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.172.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.172.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.172.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.172.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.172.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.173.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.173.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.173.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.173.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.173.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.173.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.174.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.174.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.174.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.174.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.174.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.174.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.175.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.175.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.175.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.175.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.175.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.175.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.176.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.176.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.176.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.176.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.176.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.176.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.177.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.177.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.177.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.177.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.177.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.177.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.178.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.178.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.178.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.178.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.178.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.178.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.179.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.179.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.179.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.179.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.179.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.179.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.180.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.180.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.180.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.180.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.180.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.180.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.181.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.181.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.181.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.181.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.181.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.181.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.182.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.182.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.182.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.182.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.182.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.182.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.183.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.183.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.183.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.183.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.183.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.183.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.184.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.184.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.184.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.184.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.184.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.184.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.185.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.185.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.185.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.185.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.185.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.185.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.186.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.186.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.186.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.186.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.186.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.186.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.187.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.187.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.187.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.187.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.187.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.187.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.188.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.188.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.188.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.188.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.188.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.188.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.189.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.189.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.189.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.189.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.189.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.189.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.190.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.190.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.190.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.190.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.190.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.190.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.191.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.191.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.191.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.191.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.191.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.191.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.192.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.192.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.192.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.192.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.192.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.192.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.193.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.193.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.193.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.193.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.193.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.193.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.194.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.194.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.194.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.194.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.194.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.194.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.195.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.195.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.195.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.195.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.195.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.195.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.196.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.196.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.196.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.196.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.196.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.196.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.197.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.197.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.197.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.197.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.197.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.197.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.198.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.198.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.198.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.198.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.198.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.198.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.199.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.199.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.199.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.199.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.199.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.199.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.200.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.200.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.200.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.200.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.200.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.200.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.201.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.201.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.201.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.201.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.201.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.201.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.202.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.202.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.202.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.202.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.202.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.202.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.203.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.203.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.203.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.203.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.203.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.203.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.204.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.204.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.204.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.204.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.204.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.204.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.205.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.205.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.205.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.205.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.205.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.205.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.206.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.206.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.206.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.206.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.206.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.206.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.207.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.207.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.207.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.207.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.207.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.207.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.208.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.208.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.208.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.208.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.208.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.208.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.209.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.209.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.209.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.209.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.209.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.209.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.210.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.210.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.210.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.210.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.210.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.210.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.211.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.211.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.211.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.211.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.211.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.211.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.212.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.212.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.212.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.212.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.212.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.212.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.213.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.213.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.213.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.213.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.213.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.213.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.214.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.214.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.214.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.214.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.214.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.214.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.215.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.215.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.215.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.215.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.215.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.215.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.216.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.216.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.216.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.216.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.216.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.216.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.217.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.217.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.217.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.217.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.217.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.217.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.218.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.218.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.218.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.218.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.218.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.218.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.219.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.219.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.219.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.219.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.219.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.219.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.220.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.220.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.220.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.220.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.220.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.220.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.221.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.221.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.221.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.221.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.221.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.221.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.222.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.222.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.222.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.222.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.222.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.222.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.223.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.223.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.223.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.223.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.223.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.223.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.224.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.224.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.224.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.224.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.224.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.224.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.225.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.225.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.225.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.225.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.225.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.225.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.226.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.226.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.226.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.226.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.226.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.226.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.227.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.227.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.227.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.227.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.227.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.227.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.228.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.228.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.228.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.228.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.228.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.228.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.229.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.229.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.229.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.229.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.229.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.229.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.230.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.230.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.230.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.230.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.230.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.230.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.231.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.231.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.231.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.231.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.231.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.231.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.232.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.232.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.232.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.232.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.232.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.232.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.233.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.233.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.233.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.233.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.233.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.233.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.234.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.234.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.234.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.234.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.234.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.234.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.235.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.235.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.235.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.235.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.235.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.235.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.236.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.236.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.236.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.236.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.236.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.236.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.237.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.237.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.237.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.237.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.237.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.237.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.238.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.238.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.238.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.238.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.238.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.238.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.239.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.239.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.239.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.239.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.239.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.239.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.240.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.240.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.240.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.240.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.240.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.240.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.241.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.241.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.241.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.241.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.241.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.241.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.242.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.242.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.242.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.242.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.242.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.242.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.243.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.243.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.243.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.243.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.243.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.243.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.244.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.244.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.244.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.244.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.244.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.244.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.245.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.245.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.245.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.245.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.245.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.245.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.246.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.246.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.246.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.246.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.246.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.246.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.247.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.247.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.247.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.247.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.247.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.247.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.248.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.248.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.248.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.248.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.248.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.248.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.249.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.249.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.249.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.249.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.249.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.249.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.250.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.250.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.250.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.250.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.250.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.250.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.251.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.251.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.251.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.251.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.251.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.251.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.252.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.252.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.252.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.252.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.252.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.252.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.253.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.253.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.253.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.253.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.253.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.253.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.254.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.254.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.254.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.254.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.254.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.254.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.255.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.255.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.255.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.255.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.255.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.255.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.input_layernorm.weight": "model-00018-of-000163.safetensors", "model.layers.8.post_attention_layernorm.weight": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.q_a_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.self_attn.q_a_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.q_a_layernorm.weight": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.q_b_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.self_attn.q_b_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.kv_a_proj_with_mqa.weight": "model-00018-of-000163.safetensors", - "model.layers.9.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.kv_a_layernorm.weight": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.kv_b_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.self_attn.kv_b_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.o_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.self_attn.o_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.gate.weight": "model-00018-of-000163.safetensors", "model.layers.9.mlp.gate.e_score_correction_bias": "model-00018-of-000163.safetensors", "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.shared_experts.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.shared_experts.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.shared_experts.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.0.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.0.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.0.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.0.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.0.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.1.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.1.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.1.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.1.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.1.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.2.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.2.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.2.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.2.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.2.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.3.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.3.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.3.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.3.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.3.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.4.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.4.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.4.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.4.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.4.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.5.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.5.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.5.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.5.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.5.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.6.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.6.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.6.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.6.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.6.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.7.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.7.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.7.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.7.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.7.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.8.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.8.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.8.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.8.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.8.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.9.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.9.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.9.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.9.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.9.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.10.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.10.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.10.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.10.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.10.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.11.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.11.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.11.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.11.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.11.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.12.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.12.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.12.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.12.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.12.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.13.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.13.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.13.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.13.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.13.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.14.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.14.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.14.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.14.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.14.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.15.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.15.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.15.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.15.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.15.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.16.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.16.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.16.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.16.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.16.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.17.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.17.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.17.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.17.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.17.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.18.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.18.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.18.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.18.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.18.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.19.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.19.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.19.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.19.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.19.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.20.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.20.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.20.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.20.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.20.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.21.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.21.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.21.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.21.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.21.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.22.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.22.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.22.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.22.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.22.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.23.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.23.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.23.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.23.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.23.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.24.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.24.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.24.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.24.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.24.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.25.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.25.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.25.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.25.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.25.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.26.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.26.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.26.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.26.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.26.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.27.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.27.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.27.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.27.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.27.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.28.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.28.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.28.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.28.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.28.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.29.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.29.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.29.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.29.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.29.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.30.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.30.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.30.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.30.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.30.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.31.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.31.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.31.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.31.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.31.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.32.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.32.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.32.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.32.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.32.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.33.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.33.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.33.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.33.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.33.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.34.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.34.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.34.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.34.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.34.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.35.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.35.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.35.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.35.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.35.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.36.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.36.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.36.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.36.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.36.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.37.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.37.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.37.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.37.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.37.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.38.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.38.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.38.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.38.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.38.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.38.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.39.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.39.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.39.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.39.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.39.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.40.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.40.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.40.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.40.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.40.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.41.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.41.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.41.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.41.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.41.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.42.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.42.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.42.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.42.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.42.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.43.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.43.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.43.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.43.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.43.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.44.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.44.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.44.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.44.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.44.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.45.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.45.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.45.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.45.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.45.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.46.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.46.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.46.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.46.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.46.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.47.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.47.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.47.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.47.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.47.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.48.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.48.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.48.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.48.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.48.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.49.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.49.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.49.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.49.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.49.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.50.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.50.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.50.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.50.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.50.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.51.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.51.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.51.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.51.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.51.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.52.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.52.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.52.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.52.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.52.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.52.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.53.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.53.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.53.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.53.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.53.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.54.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.54.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.54.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.54.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.54.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.55.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.55.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.55.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.55.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.55.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.56.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.56.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.56.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.56.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.56.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.57.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.57.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.57.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.57.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.57.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.58.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.58.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.58.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.58.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.58.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.59.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.59.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.59.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.59.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.59.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.60.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.60.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.60.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.60.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.60.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.61.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.61.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.61.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.61.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.61.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.62.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.62.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.62.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.62.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.62.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.63.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.63.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.63.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.63.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.63.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.64.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.64.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.64.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.64.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.64.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.65.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.65.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.65.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.65.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.65.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.66.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.66.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.66.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.66.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.66.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.67.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.67.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.67.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.67.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.67.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.68.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.68.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.68.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.68.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.68.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.69.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.69.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.69.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.69.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.69.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.70.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.70.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.70.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.70.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.70.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.71.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.71.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.71.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.71.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.71.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.72.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.72.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.72.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.72.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.72.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.73.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.73.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.73.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.73.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.73.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.74.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.74.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.74.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.74.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.74.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.75.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.75.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.75.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.75.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.75.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.76.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.76.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.76.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.76.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.76.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.77.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.77.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.77.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.77.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.77.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.78.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.78.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.78.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.78.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.78.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.79.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.79.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.79.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.79.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.79.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.80.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.80.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.80.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.80.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.80.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.80.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.81.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.81.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.81.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.81.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.81.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.82.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.82.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.82.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.82.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.82.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.83.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.83.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.83.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.83.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.83.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.84.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.84.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.84.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.84.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.84.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.85.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.85.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.85.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.85.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.85.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.86.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.86.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.86.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.86.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.86.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.87.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.87.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.87.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.87.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.87.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.88.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.88.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.88.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.88.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.88.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.89.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.89.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.89.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.89.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.89.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.90.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.90.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.90.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.90.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.90.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.91.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.91.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.91.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.91.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.91.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.92.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.92.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.92.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.92.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.92.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.93.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.93.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.93.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.93.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.93.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.94.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.94.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.94.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.94.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.94.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.95.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.95.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.95.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.95.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.95.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.96.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.96.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.96.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.96.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.96.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.97.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.97.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.97.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.97.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.97.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.98.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.98.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.98.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.98.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.98.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.99.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.99.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.99.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.99.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.99.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.100.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.100.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.100.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.100.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.100.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.101.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.101.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.101.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.101.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.101.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.102.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.102.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.102.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.102.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.102.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.103.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.103.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.103.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.103.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.103.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.104.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.104.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.104.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.104.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.104.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.105.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.105.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.105.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.105.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.105.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.106.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.106.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.106.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.106.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.106.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.107.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.107.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.107.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.107.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.107.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.108.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.108.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.108.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.108.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.108.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.109.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.109.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.109.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.109.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.109.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.110.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.110.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.110.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.110.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.110.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.111.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.111.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.111.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.111.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.111.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.112.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.112.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.112.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.112.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.112.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.113.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.113.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.113.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.113.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.113.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.114.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.114.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.114.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.114.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.114.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.115.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.115.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.115.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.115.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.115.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.116.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.116.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.116.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.116.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.116.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.117.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.117.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.117.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.117.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.117.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.118.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.118.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.118.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.118.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.118.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.119.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.119.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.119.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.119.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.119.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.120.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.120.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.120.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.120.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.120.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.121.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.121.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.121.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.121.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.121.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.122.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.122.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.122.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.122.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.122.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.123.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.123.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.123.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.123.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.123.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.124.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.124.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.124.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.124.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.124.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.125.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.125.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.125.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.125.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.125.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.126.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.126.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.126.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.126.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.126.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.127.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.127.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.127.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.127.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.127.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.128.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.128.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.128.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.128.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.128.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.128.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.129.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.129.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.129.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.129.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.129.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.129.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.130.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.130.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.130.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.130.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.130.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.130.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.131.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.131.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.131.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.131.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.131.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.131.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.132.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.132.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.132.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.132.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.132.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.132.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.133.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.133.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.133.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.133.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.133.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.133.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.134.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.134.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.134.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.134.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.134.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.134.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.135.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.135.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.135.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.135.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.135.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.135.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.136.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.136.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.136.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.136.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.136.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.136.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.137.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.137.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.137.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.137.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.137.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.137.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.138.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.138.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.138.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.138.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.138.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.138.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.139.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.139.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.139.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.139.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.139.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.139.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.140.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.140.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.140.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.140.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.140.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.140.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.141.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.141.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.141.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.141.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.141.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.141.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.142.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.142.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.142.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.142.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.142.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.142.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.143.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.143.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.143.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.143.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.143.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.143.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.144.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.144.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.144.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.144.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.144.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.144.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.145.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.145.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.145.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.145.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.145.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.145.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.146.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.146.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.146.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.146.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.146.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.146.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.147.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.147.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.147.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.147.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.147.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.147.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.148.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.148.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.148.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.148.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.148.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.148.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.149.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.149.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.149.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.149.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.149.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.149.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.150.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.150.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.150.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.150.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.150.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.150.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.151.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.151.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.151.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.151.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.151.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.151.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.152.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.152.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.152.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.152.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.152.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.152.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.153.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.153.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.153.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.153.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.153.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.153.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.154.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.154.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.154.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.154.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.154.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.154.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.155.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.155.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.155.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.155.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.155.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.155.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.156.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.156.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.156.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.156.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.156.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.156.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.157.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.157.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.157.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.157.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.157.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.157.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.158.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.158.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.158.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.158.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.158.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.158.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.159.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.159.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.159.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.159.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.159.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.159.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.160.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.160.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.160.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.160.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.160.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.160.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.161.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.161.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.161.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.161.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.161.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.161.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.162.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.162.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.162.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.162.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.162.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.162.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.163.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.163.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.163.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.163.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.163.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.163.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.164.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.164.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.164.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.164.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.164.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.164.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.165.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.165.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.165.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.165.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.165.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.165.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.166.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.166.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.166.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.166.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.166.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.166.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.167.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.167.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.167.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.167.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.167.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.167.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.168.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.168.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.168.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.168.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.168.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.168.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.169.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.169.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.169.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.169.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.169.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.169.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.170.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.170.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.170.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.170.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.170.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.170.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.171.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.171.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.171.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.171.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.171.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.171.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.172.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.172.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.172.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.172.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.172.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.172.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.173.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.173.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.173.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.173.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.173.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.173.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.174.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.174.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.174.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.174.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.174.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.174.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.175.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.175.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.175.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.175.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.175.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.175.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.176.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.176.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.176.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.176.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.176.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.176.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.177.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.177.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.177.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.177.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.177.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.177.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.178.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.178.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.178.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.178.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.178.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.178.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.179.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.179.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.179.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.179.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.179.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.179.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.180.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.180.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.180.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.180.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.180.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.180.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.181.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.181.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.181.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.181.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.181.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.181.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.182.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.182.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.182.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.182.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.182.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.182.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.183.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.183.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.183.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.183.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.183.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.183.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.184.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.184.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.184.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.184.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.184.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.184.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.185.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.185.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.185.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.185.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.185.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.185.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.186.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.186.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.186.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.186.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.186.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.186.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.187.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.187.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.187.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.187.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.187.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.187.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.188.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.188.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.188.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.188.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.188.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.188.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.189.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.189.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.189.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.189.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.189.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.189.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.190.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.190.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.190.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.190.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.190.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.190.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.191.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.191.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.191.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.191.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.191.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.191.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.192.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.192.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.192.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.192.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.192.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.192.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.193.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.193.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.193.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.193.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.193.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.193.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.194.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.194.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.194.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.194.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.194.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.194.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.195.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.195.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.195.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.195.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.195.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.195.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.196.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.196.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.196.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.196.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.196.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.196.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.197.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.197.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.197.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.197.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.197.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.197.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.198.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.198.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.198.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.198.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.198.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.198.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.199.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.199.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.199.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.199.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.199.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.199.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.200.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.200.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.200.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.200.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.200.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.200.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.201.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.201.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.201.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.201.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.201.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.201.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.202.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.202.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.202.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.202.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.202.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.202.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.203.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.203.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.203.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.203.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.203.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.203.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.204.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.204.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.204.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.204.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.204.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.204.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.205.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.205.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.205.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.205.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.205.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.205.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.206.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.206.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.206.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.206.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.206.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.206.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.207.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.207.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.207.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.207.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.207.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.207.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.208.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.208.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.208.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.208.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.208.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.208.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.209.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.209.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.209.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.209.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.209.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.209.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.210.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.210.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.210.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.210.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.210.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.210.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.211.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.211.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.211.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.211.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.211.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.211.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.212.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.212.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.212.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.212.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.212.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.212.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.213.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.213.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.213.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.213.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.213.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.213.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.214.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.214.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.214.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.214.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.214.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.214.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.215.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.215.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.215.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.215.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.215.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.215.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.216.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.216.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.216.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.216.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.216.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.216.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.217.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.217.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.217.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.217.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.217.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.217.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.218.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.218.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.218.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.218.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.218.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.218.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.219.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.219.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.219.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.219.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.219.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.219.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.220.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.220.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.220.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.220.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.220.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.220.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.221.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.221.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.221.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.221.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.221.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.221.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.222.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.222.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.222.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.222.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.222.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.222.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.223.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.223.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.223.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.223.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.223.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.223.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.224.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.224.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.224.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.224.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.224.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.224.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.225.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.225.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.225.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.225.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.225.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.225.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.226.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.226.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.226.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.226.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.226.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.226.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.227.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.227.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.227.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.227.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.227.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.227.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.228.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.228.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.228.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.228.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.228.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.228.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.229.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.229.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.229.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.229.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.229.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.229.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.230.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.230.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.230.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.230.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.230.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.230.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.231.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.231.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.231.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.231.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.231.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.231.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.232.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.232.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.232.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.232.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.232.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.232.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.233.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.233.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.233.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.233.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.233.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.233.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.234.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.234.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.234.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.234.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.234.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.234.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.235.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.235.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.235.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.235.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.235.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.235.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.236.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.236.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.236.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.236.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.236.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.236.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.237.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.237.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.237.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.237.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.237.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.237.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.238.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.238.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.238.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.238.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.238.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.238.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.239.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.239.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.239.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.239.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.239.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.239.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.240.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.240.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.240.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.240.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.240.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.240.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.241.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.241.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.241.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.241.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.241.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.241.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.242.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.242.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.242.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.242.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.242.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.242.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.243.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.243.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.243.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.243.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.243.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.243.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.244.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.244.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.244.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.244.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.244.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.244.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.245.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.245.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.245.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.245.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.245.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.245.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.246.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.246.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.246.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.246.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.246.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.246.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.247.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.247.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.247.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.247.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.247.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.247.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.248.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.248.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.248.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.248.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.248.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.248.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.249.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.249.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.249.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.249.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.249.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.249.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.250.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.250.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.250.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.250.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.250.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.250.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.251.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.251.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.251.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.251.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.251.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.251.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.252.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.252.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.252.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.252.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.252.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.252.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.253.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.253.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.253.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.253.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.253.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.253.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.254.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.254.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.254.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.254.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.254.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.254.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.255.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.255.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.255.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.255.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.255.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.255.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.input_layernorm.weight": "model-00021-of-000163.safetensors", "model.layers.9.post_attention_layernorm.weight": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.q_a_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.self_attn.q_a_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.q_a_layernorm.weight": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.q_b_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.self_attn.q_b_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.kv_a_proj_with_mqa.weight": "model-00021-of-000163.safetensors", - "model.layers.10.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.kv_a_layernorm.weight": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.kv_b_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.self_attn.kv_b_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.o_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.self_attn.o_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.gate.weight": "model-00021-of-000163.safetensors", "model.layers.10.mlp.gate.e_score_correction_bias": "model-00021-of-000163.safetensors", "model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.shared_experts.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.shared_experts.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.0.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.0.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.0.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.0.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.0.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.1.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.1.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.1.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.1.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.1.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.2.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.2.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.2.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.2.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.2.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.3.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.3.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.3.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.3.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.3.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.4.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.4.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.4.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.4.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.4.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.5.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.5.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.5.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.5.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.5.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.6.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.6.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.6.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.6.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.6.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.7.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.7.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.7.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.7.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.7.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.8.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.8.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.8.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.8.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.8.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.9.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.9.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.9.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.9.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.9.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.10.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.10.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.10.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.10.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.10.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.11.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.11.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.11.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.11.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.11.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.12.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.12.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.12.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.12.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.12.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.13.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.13.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.13.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.13.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.13.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.14.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.14.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.14.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.14.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.14.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.15.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.15.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.15.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.15.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.15.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.16.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.16.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.16.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.16.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.16.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.17.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.17.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.17.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.17.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.17.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.18.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.18.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.18.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.18.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.18.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.19.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.19.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.19.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.19.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.19.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.20.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.20.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.20.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.20.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.20.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.21.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.21.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.21.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.21.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.21.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.22.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.22.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.22.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.22.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.22.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.23.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.23.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.23.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.23.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.23.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.24.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.24.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.24.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.24.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.24.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.25.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.25.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.25.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.25.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.25.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.26.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.26.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.26.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.26.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.26.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.27.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.27.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.27.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.27.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.27.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.27.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.28.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.28.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.28.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.28.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.28.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.29.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.29.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.29.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.29.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.29.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.30.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.30.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.30.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.30.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.30.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.31.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.31.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.31.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.31.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.31.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.32.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.32.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.32.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.32.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.32.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.33.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.33.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.33.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.33.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.33.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.34.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.34.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.34.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.34.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.34.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.35.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.35.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.35.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.35.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.35.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.36.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.36.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.36.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.36.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.36.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.37.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.37.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.37.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.37.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.37.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.38.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.38.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.38.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.38.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.38.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.39.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.39.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.39.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.39.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.39.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.40.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.40.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.40.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.40.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.40.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.41.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.41.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.41.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.41.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.41.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.42.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.42.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.42.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.42.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.42.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.43.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.43.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.43.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.43.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.43.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.44.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.44.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.44.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.44.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.44.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.45.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.45.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.45.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.45.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.45.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.46.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.46.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.46.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.46.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.46.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.47.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.47.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.47.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.47.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.47.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.48.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.48.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.48.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.48.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.48.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.49.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.49.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.49.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.49.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.49.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.50.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.50.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.50.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.50.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.50.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.51.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.51.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.51.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.51.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.51.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.52.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.52.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.52.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.52.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.52.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.53.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.53.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.53.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.53.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.53.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.54.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.54.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.54.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.54.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.54.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.55.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.55.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.55.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.55.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.55.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.56.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.56.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.56.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.56.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.56.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.57.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.57.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.57.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.57.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.57.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.58.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.58.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.58.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.58.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.58.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.59.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.59.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.59.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.59.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.59.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.60.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.60.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.60.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.60.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.60.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.61.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.61.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.61.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.61.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.61.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.62.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.62.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.62.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.62.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.62.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.63.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.63.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.63.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.63.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.63.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.64.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.64.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.64.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.64.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.64.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.65.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.65.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.65.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.65.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.65.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.66.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.66.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.66.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.66.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.66.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.67.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.67.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.67.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.67.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.67.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.68.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.68.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.68.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.68.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.68.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.69.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.69.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.69.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.69.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.69.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.70.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.70.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.70.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.70.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.70.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.71.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.71.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.71.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.71.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.71.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.72.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.72.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.72.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.72.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.72.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.73.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.73.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.73.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.73.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.73.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.74.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.74.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.74.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.74.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.74.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.75.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.75.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.75.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.75.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.75.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.76.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.76.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.76.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.76.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.76.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.77.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.77.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.77.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.77.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.77.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.78.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.78.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.78.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.78.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.78.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.79.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.79.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.79.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.79.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.79.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.80.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.80.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.80.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.80.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.80.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.81.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.81.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.81.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.81.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.81.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.82.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.82.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.82.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.82.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.82.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.83.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.83.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.83.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.83.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.83.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.83.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.84.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.84.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.84.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.84.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.84.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.85.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.85.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.85.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.85.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.85.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.86.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.86.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.86.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.86.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.86.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.87.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.87.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.87.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.87.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.87.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.88.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.88.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.88.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.88.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.88.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.89.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.89.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.89.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.89.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.89.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.90.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.90.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.90.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.90.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.90.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.91.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.91.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.91.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.91.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.91.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.92.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.92.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.92.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.92.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.92.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.93.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.93.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.93.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.93.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.93.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.94.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.94.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.94.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.94.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.94.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.95.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.95.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.95.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.95.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.95.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.96.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.96.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.96.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.96.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.96.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.97.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.97.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.97.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.97.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.97.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.98.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.98.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.98.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.98.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.98.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.99.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.99.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.99.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.99.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.99.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.100.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.100.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.100.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.100.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.100.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.101.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.101.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.101.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.101.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.101.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.102.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.102.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.102.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.102.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.102.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.102.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.103.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.103.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.103.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.103.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.103.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.104.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.104.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.104.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.104.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.104.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.105.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.105.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.105.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.105.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.105.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.106.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.106.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.106.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.106.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.106.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.107.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.107.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.107.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.107.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.107.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.108.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.108.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.108.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.108.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.108.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.109.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.109.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.109.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.109.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.109.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.110.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.110.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.110.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.110.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.110.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.111.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.111.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.111.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.111.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.111.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.112.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.112.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.112.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.112.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.112.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.113.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.113.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.113.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.113.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.113.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.114.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.114.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.114.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.114.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.114.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.115.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.115.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.115.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.115.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.115.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.116.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.116.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.116.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.116.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.116.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.116.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.117.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.117.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.117.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.117.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.117.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.118.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.118.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.118.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.118.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.118.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.119.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.119.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.119.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.119.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.119.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.120.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.120.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.120.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.120.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.120.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.121.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.121.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.121.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.121.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.121.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.122.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.122.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.122.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.122.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.122.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.123.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.123.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.123.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.123.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.123.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.124.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.124.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.124.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.124.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.124.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.125.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.125.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.125.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.125.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.125.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.126.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.126.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.126.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.126.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.126.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.127.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.127.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.127.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.127.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.127.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.128.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.128.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.128.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.128.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.128.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.128.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.129.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.129.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.129.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.129.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.129.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.129.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.130.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.130.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.130.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.130.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.130.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.130.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.131.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.131.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.131.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.131.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.131.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.131.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.132.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.132.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.132.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.132.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.132.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.132.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.133.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.133.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.133.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.133.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.133.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.133.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.134.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.134.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.134.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.134.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.134.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.134.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.135.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.135.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.135.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.135.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.135.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.135.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.136.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.136.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.136.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.136.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.136.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.136.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.137.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.137.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.137.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.137.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.137.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.137.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.138.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.138.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.138.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.138.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.138.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.138.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.139.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.139.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.139.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.139.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.139.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.139.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.140.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.140.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.140.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.140.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.140.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.140.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.141.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.141.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.141.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.141.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.141.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.141.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.142.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.142.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.142.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.142.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.142.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.142.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.143.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.143.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.143.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.143.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.143.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.143.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.144.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.144.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.144.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.144.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.144.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.144.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.145.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.145.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.145.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.145.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.145.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.145.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.146.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.146.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.146.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.146.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.146.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.146.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.147.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.147.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.147.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.147.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.147.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.147.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.148.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.148.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.148.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.148.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.148.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.148.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.149.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.149.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.149.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.149.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.149.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.149.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.150.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.150.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.150.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.150.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.150.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.150.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.151.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.151.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.151.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.151.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.151.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.151.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.152.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.152.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.152.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.152.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.152.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.152.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.153.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.153.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.153.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.153.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.153.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.153.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.154.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.154.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.154.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.154.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.154.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.154.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.155.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.155.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.155.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.155.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.155.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.155.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.156.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.156.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.156.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.156.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.156.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.156.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.157.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.157.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.157.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.157.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.157.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.157.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.158.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.158.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.158.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.158.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.158.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.158.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.159.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.159.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.159.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.159.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.159.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.159.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.160.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.160.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.160.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.160.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.160.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.160.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.161.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.161.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.161.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.161.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.161.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.161.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.162.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.162.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.162.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.162.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.162.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.162.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.163.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.163.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.163.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.163.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.163.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.163.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.164.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.164.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.164.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.164.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.164.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.164.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.165.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.165.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.165.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.165.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.165.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.165.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.166.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.166.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.166.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.166.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.166.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.166.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.167.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.167.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.167.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.167.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.167.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.167.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.168.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.168.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.168.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.168.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.168.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.168.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.169.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.169.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.169.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.169.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.169.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.169.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.170.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.170.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.170.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.170.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.170.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.170.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.171.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.171.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.171.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.171.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.171.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.171.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.172.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.172.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.172.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.172.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.172.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.172.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.173.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.173.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.173.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.173.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.173.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.173.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.174.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.174.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.174.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.174.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.174.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.174.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.175.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.175.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.175.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.175.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.175.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.175.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.176.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.176.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.176.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.176.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.176.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.176.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.177.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.177.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.177.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.177.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.177.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.177.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.178.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.178.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.178.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.178.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.178.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.178.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.179.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.179.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.179.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.179.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.179.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.179.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.180.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.180.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.180.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.180.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.180.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.180.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.181.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.181.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.181.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.181.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.181.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.181.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.182.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.182.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.182.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.182.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.182.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.182.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.183.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.183.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.183.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.183.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.183.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.183.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.184.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.184.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.184.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.184.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.184.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.184.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.185.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.185.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.185.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.185.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.185.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.185.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.186.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.186.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.186.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.186.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.186.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.186.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.187.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.187.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.187.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.187.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.187.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.187.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.188.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.188.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.188.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.188.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.188.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.188.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.189.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.189.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.189.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.189.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.189.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.189.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.190.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.190.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.190.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.190.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.190.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.190.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.191.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.191.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.191.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.191.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.191.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.191.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.192.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.192.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.192.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.192.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.192.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.192.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.193.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.193.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.193.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.193.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.193.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.193.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.194.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.194.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.194.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.194.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.194.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.194.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.195.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.195.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.195.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.195.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.195.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.195.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.196.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.196.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.196.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.196.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.196.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.196.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.197.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.197.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.197.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.197.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.197.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.197.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.198.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.198.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.198.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.198.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.198.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.198.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.199.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.199.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.199.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.199.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.199.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.199.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.200.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.200.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.200.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.200.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.200.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.200.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.201.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.201.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.201.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.201.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.201.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.201.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.202.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.202.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.202.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.202.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.202.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.202.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.203.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.203.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.203.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.203.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.203.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.203.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.204.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.204.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.204.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.204.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.204.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.204.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.205.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.205.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.205.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.205.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.205.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.205.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.206.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.206.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.206.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.206.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.206.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.206.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.207.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.207.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.207.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.207.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.207.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.207.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.208.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.208.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.208.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.208.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.208.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.208.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.209.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.209.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.209.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.209.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.209.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.209.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.210.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.210.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.210.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.210.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.210.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.210.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.211.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.211.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.211.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.211.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.211.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.211.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.212.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.212.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.212.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.212.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.212.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.212.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.213.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.213.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.213.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.213.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.213.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.213.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.214.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.214.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.214.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.214.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.214.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.214.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.215.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.215.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.215.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.215.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.215.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.215.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.216.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.216.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.216.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.216.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.216.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.216.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.217.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.217.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.217.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.217.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.217.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.217.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.218.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.218.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.218.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.218.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.218.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.218.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.219.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.219.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.219.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.219.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.219.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.219.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.220.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.220.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.220.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.220.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.220.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.220.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.221.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.221.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.221.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.221.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.221.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.221.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.222.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.222.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.222.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.222.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.222.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.222.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.223.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.223.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.223.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.223.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.223.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.223.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.224.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.224.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.224.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.224.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.224.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.224.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.225.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.225.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.225.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.225.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.225.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.225.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.226.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.226.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.226.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.226.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.226.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.226.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.227.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.227.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.227.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.227.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.227.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.227.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.228.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.228.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.228.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.228.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.228.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.228.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.229.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.229.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.229.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.229.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.229.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.229.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.230.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.230.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.230.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.230.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.230.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.230.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.231.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.231.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.231.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.231.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.231.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.231.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.232.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.232.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.232.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.232.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.232.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.232.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.233.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.233.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.233.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.233.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.233.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.233.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.234.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.234.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.234.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.234.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.234.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.234.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.235.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.235.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.235.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.235.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.235.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.235.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.236.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.236.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.236.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.236.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.236.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.236.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.237.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.237.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.237.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.237.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.237.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.237.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.238.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.238.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.238.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.238.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.238.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.238.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.239.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.239.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.239.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.239.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.239.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.239.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.240.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.240.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.240.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.240.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.240.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.240.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.241.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.241.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.241.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.241.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.241.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.241.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.242.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.242.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.242.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.242.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.242.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.242.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.243.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.243.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.243.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.243.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.243.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.243.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.244.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.244.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.244.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.244.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.244.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.244.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.245.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.245.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.245.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.245.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.245.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.245.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.246.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.246.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.246.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.246.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.246.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.246.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.247.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.247.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.247.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.247.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.247.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.247.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.248.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.248.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.248.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.248.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.248.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.248.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.249.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.249.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.249.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.249.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.249.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.249.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.250.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.250.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.250.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.250.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.250.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.250.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.251.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.251.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.251.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.251.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.251.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.251.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.252.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.252.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.252.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.252.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.252.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.252.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.253.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.253.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.253.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.253.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.253.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.253.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.254.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.254.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.254.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.254.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.254.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.254.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.255.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.255.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.255.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.255.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.255.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.255.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.input_layernorm.weight": "model-00023-of-000163.safetensors", "model.layers.10.post_attention_layernorm.weight": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.q_a_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.self_attn.q_a_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.q_a_layernorm.weight": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.q_b_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.self_attn.q_b_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.kv_a_proj_with_mqa.weight": "model-00023-of-000163.safetensors", - "model.layers.11.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.kv_a_layernorm.weight": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.kv_b_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.self_attn.kv_b_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.o_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.self_attn.o_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.gate.weight": "model-00023-of-000163.safetensors", "model.layers.11.mlp.gate.e_score_correction_bias": "model-00023-of-000163.safetensors", "model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.shared_experts.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.shared_experts.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.shared_experts.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.shared_experts.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.0.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.0.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.0.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.0.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.0.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.1.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.1.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.1.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.1.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.1.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.2.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.2.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.2.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.2.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.2.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.3.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.3.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.3.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.3.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.3.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.4.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.4.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.4.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.4.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.4.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.5.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.5.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.5.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.5.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.5.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.6.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.6.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.6.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.6.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.6.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.7.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.7.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.7.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.7.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.7.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.8.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.8.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.8.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.8.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.8.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.9.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.9.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.9.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.9.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.9.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.10.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.10.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.10.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.10.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.10.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.11.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.11.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.11.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.11.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.11.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.12.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.12.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.12.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.12.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.12.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.13.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.13.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.13.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.13.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.13.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.14.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.14.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.14.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.14.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.14.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.15.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.15.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.15.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.15.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.15.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.16.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.16.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.16.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.16.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.16.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.17.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.17.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.17.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.17.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.17.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.18.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.18.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.18.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.18.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.18.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.19.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.19.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.19.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.19.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.19.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.20.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.20.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.20.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.20.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.20.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.21.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.21.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.21.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.21.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.21.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.22.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.22.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.22.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.22.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.22.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.23.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.23.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.23.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.23.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.23.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.24.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.24.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.24.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.24.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.24.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.25.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.25.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.25.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.25.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.25.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.26.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.26.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.26.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.26.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.26.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.27.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.27.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.27.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.27.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.27.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.28.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.28.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.28.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.28.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.28.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.29.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.29.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.29.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.29.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.29.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.29.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.30.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.30.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.30.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.30.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.30.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.31.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.31.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.31.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.31.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.31.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.32.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.32.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.32.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.32.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.32.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.33.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.33.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.33.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.33.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.33.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.34.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.34.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.34.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.34.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.34.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.35.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.35.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.35.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.35.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.35.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.36.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.36.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.36.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.36.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.36.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.37.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.37.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.37.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.37.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.37.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.38.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.38.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.38.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.38.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.38.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.39.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.39.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.39.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.39.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.39.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.40.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.40.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.40.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.40.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.40.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.41.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.41.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.41.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.41.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.41.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.42.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.42.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.42.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.42.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.42.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.43.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.43.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.43.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.43.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.43.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.44.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.44.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.44.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.44.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.44.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.45.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.45.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.45.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.45.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.45.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.45.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.46.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.46.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.46.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.46.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.46.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.47.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.47.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.47.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.47.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.47.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.48.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.48.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.48.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.48.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.48.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.49.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.49.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.49.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.49.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.49.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.50.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.50.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.50.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.50.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.50.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.51.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.51.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.51.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.51.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.51.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.52.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.52.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.52.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.52.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.52.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.53.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.53.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.53.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.53.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.53.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.54.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.54.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.54.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.54.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.54.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.55.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.55.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.55.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.55.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.55.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.56.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.56.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.56.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.56.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.56.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.57.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.57.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.57.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.57.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.57.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.58.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.58.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.58.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.58.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.58.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.59.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.59.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.59.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.59.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.59.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.60.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.60.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.60.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.60.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.60.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.61.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.61.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.61.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.61.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.61.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.62.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.62.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.62.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.62.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.62.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.63.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.63.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.63.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.63.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.63.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.64.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.64.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.64.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.64.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.64.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.65.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.65.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.65.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.65.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.65.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.66.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.66.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.66.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.66.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.66.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.67.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.67.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.67.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.67.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.67.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.68.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.68.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.68.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.68.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.68.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.69.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.69.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.69.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.69.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.69.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.70.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.70.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.70.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.70.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.70.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.71.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.71.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.71.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.71.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.71.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.72.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.72.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.72.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.72.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.72.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.73.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.73.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.73.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.73.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.73.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.74.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.74.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.74.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.74.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.74.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.75.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.75.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.75.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.75.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.75.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.76.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.76.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.76.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.76.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.76.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.77.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.77.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.77.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.77.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.77.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.78.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.78.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.78.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.78.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.78.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.79.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.79.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.79.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.79.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.79.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.80.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.80.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.80.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.80.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.80.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.81.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.81.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.81.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.81.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.81.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.82.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.82.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.82.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.82.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.82.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.83.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.83.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.83.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.83.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.83.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.84.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.84.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.84.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.84.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.84.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.85.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.85.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.85.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.85.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.85.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.86.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.86.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.86.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.86.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.86.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.87.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.87.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.87.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.87.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.87.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.88.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.88.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.88.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.88.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.88.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.89.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.89.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.89.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.89.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.89.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.90.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.90.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.90.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.90.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.90.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.91.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.91.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.91.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.91.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.91.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.92.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.92.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.92.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.92.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.92.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.93.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.93.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.93.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.93.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.93.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.94.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.94.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.94.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.94.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.94.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.94.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.95.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.95.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.95.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.95.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.95.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.96.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.96.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.96.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.96.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.96.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.97.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.97.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.97.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.97.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.97.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.98.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.98.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.98.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.98.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.98.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.99.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.99.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.99.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.99.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.99.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.100.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.100.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.100.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.100.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.100.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.101.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.101.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.101.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.101.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.101.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.101.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.102.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.102.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.102.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.102.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.102.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.103.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.103.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.103.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.103.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.103.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.104.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.104.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.104.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.104.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.104.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.105.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.105.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.105.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.105.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.105.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.106.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.106.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.106.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.106.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.106.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.107.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.107.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.107.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.107.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.107.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.108.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.108.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.108.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.108.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.108.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.109.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.109.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.109.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.109.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.109.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.110.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.110.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.110.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.110.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.110.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.111.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.111.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.111.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.111.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.111.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.112.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.112.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.112.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.112.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.112.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.113.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.113.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.113.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.113.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.113.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.114.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.114.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.114.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.114.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.114.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.115.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.115.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.115.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.115.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.115.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.116.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.116.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.116.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.116.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.116.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.117.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.117.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.117.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.117.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.117.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.118.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.118.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.118.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.118.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.118.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.119.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.119.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.119.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.119.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.119.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.120.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.120.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.120.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.120.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.120.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.121.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.121.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.121.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.121.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.121.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.122.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.122.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.122.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.122.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.122.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.123.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.123.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.123.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.123.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.123.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.124.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.124.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.124.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.124.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.124.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.125.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.125.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.125.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.125.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.125.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.126.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.126.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.126.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.126.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.126.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.127.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.127.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.127.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.127.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.127.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.128.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.128.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.128.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.128.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.128.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.128.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.129.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.129.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.129.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.129.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.129.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.129.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.130.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.130.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.130.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.130.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.130.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.130.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.131.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.131.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.131.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.131.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.131.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.131.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.132.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.132.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.132.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.132.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.132.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.132.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.133.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.133.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.133.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.133.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.133.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.133.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.134.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.134.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.134.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.134.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.134.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.134.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.135.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.135.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.135.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.135.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.135.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.135.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.136.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.136.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.136.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.136.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.136.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.136.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.137.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.137.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.137.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.137.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.137.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.137.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.138.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.138.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.138.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.138.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.138.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.138.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.139.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.139.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.139.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.139.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.139.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.139.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.140.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.140.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.140.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.140.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.140.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.140.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.141.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.141.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.141.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.141.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.141.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.141.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.142.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.142.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.142.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.142.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.142.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.142.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.143.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.143.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.143.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.143.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.143.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.143.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.144.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.144.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.144.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.144.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.144.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.144.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.145.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.145.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.145.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.145.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.145.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.145.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.146.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.146.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.146.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.146.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.146.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.146.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.147.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.147.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.147.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.147.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.147.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.147.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.148.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.148.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.148.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.148.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.148.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.148.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.149.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.149.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.149.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.149.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.149.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.149.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.150.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.150.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.150.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.150.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.150.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.150.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.151.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.151.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.151.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.151.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.151.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.151.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.152.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.152.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.152.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.152.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.152.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.152.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.153.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.153.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.153.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.153.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.153.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.153.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.154.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.154.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.154.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.154.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.154.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.154.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.155.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.155.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.155.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.155.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.155.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.155.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.156.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.156.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.156.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.156.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.156.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.156.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.157.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.157.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.157.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.157.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.157.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.157.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.158.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.158.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.158.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.158.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.158.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.158.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.159.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.159.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.159.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.159.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.159.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.159.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.160.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.160.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.160.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.160.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.160.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.160.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.161.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.161.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.161.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.161.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.161.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.161.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.162.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.162.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.162.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.162.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.162.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.162.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.163.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.163.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.163.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.163.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.163.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.163.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.164.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.164.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.164.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.164.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.164.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.164.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.165.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.165.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.165.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.165.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.165.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.165.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.166.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.166.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.166.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.166.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.166.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.166.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.167.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.167.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.167.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.167.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.167.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.167.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.168.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.168.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.168.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.168.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.168.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.168.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.169.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.169.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.169.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.169.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.169.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.169.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.170.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.170.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.170.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.170.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.170.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.170.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.171.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.171.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.171.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.171.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.171.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.171.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.172.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.172.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.172.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.172.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.172.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.172.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.173.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.173.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.173.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.173.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.173.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.173.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.174.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.174.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.174.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.174.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.174.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.174.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.175.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.175.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.175.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.175.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.175.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.175.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.176.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.176.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.176.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.176.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.176.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.176.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.177.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.177.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.177.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.177.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.177.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.177.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.178.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.178.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.178.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.178.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.178.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.178.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.179.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.179.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.179.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.179.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.179.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.179.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.180.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.180.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.180.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.180.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.180.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.180.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.181.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.181.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.181.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.181.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.181.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.181.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.182.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.182.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.182.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.182.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.182.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.182.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.183.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.183.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.183.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.183.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.183.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.183.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.184.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.184.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.184.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.184.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.184.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.184.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.185.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.185.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.185.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.185.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.185.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.185.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.186.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.186.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.186.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.186.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.186.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.186.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.187.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.187.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.187.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.187.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.187.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.187.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.188.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.188.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.188.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.188.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.188.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.188.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.189.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.189.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.189.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.189.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.189.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.189.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.190.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.190.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.190.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.190.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.190.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.190.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.191.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.191.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.191.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.191.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.191.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.191.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.192.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.192.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.192.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.192.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.192.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.192.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.193.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.193.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.193.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.193.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.193.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.193.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.194.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.194.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.194.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.194.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.194.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.194.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.195.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.195.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.195.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.195.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.195.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.195.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.196.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.196.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.196.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.196.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.196.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.196.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.197.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.197.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.197.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.197.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.197.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.197.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.198.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.198.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.198.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.198.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.198.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.198.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.199.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.199.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.199.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.199.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.199.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.199.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.200.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.200.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.200.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.200.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.200.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.200.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.201.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.201.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.201.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.201.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.201.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.201.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.202.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.202.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.202.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.202.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.202.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.202.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.203.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.203.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.203.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.203.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.203.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.203.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.204.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.204.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.204.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.204.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.204.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.204.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.205.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.205.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.205.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.205.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.205.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.205.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.206.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.206.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.206.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.206.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.206.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.206.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.207.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.207.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.207.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.207.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.207.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.207.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.208.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.208.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.208.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.208.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.208.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.208.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.209.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.209.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.209.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.209.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.209.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.209.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.210.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.210.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.210.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.210.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.210.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.210.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.211.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.211.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.211.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.211.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.211.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.211.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.212.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.212.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.212.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.212.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.212.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.212.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.213.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.213.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.213.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.213.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.213.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.213.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.214.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.214.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.214.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.214.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.214.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.214.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.215.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.215.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.215.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.215.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.215.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.215.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.216.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.216.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.216.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.216.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.216.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.216.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.217.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.217.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.217.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.217.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.217.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.217.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.218.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.218.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.218.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.218.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.218.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.218.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.219.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.219.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.219.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.219.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.219.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.219.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.220.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.220.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.220.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.220.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.220.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.220.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.221.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.221.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.221.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.221.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.221.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.221.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.222.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.222.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.222.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.222.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.222.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.222.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.223.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.223.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.223.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.223.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.223.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.223.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.224.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.224.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.224.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.224.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.224.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.224.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.225.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.225.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.225.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.225.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.225.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.225.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.226.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.226.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.226.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.226.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.226.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.226.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.227.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.227.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.227.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.227.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.227.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.227.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.228.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.228.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.228.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.228.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.228.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.228.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.229.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.229.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.229.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.229.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.229.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.229.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.230.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.230.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.230.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.230.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.230.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.230.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.231.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.231.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.231.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.231.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.231.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.231.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.232.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.232.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.232.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.232.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.232.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.232.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.233.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.233.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.233.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.233.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.233.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.233.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.234.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.234.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.234.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.234.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.234.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.234.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.235.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.235.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.235.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.235.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.235.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.235.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.236.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.236.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.236.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.236.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.236.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.236.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.237.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.237.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.237.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.237.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.237.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.237.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.238.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.238.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.238.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.238.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.238.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.238.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.239.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.239.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.239.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.239.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.239.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.239.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.240.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.240.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.240.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.240.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.240.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.240.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.241.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.241.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.241.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.241.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.241.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.241.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.242.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.242.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.242.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.242.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.242.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.242.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.243.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.243.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.243.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.243.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.243.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.243.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.244.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.244.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.244.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.244.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.244.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.244.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.245.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.245.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.245.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.245.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.245.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.245.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.246.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.246.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.246.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.246.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.246.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.246.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.247.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.247.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.247.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.247.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.247.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.247.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.248.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.248.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.248.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.248.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.248.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.248.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.249.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.249.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.249.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.249.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.249.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.249.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.250.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.250.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.250.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.250.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.250.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.250.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.251.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.251.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.251.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.251.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.251.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.251.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.252.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.252.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.252.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.252.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.252.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.252.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.253.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.253.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.253.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.253.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.253.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.253.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.254.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.254.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.254.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.254.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.254.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.254.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.255.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.255.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.255.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.255.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.255.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.255.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.input_layernorm.weight": "model-00026-of-000163.safetensors", "model.layers.11.post_attention_layernorm.weight": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.q_a_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.self_attn.q_a_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.q_a_layernorm.weight": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.q_b_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.self_attn.q_b_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.kv_a_proj_with_mqa.weight": "model-00026-of-000163.safetensors", - "model.layers.12.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.kv_a_layernorm.weight": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.kv_b_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.self_attn.kv_b_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.o_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.self_attn.o_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.gate.weight": "model-00026-of-000163.safetensors", "model.layers.12.mlp.gate.e_score_correction_bias": "model-00026-of-000163.safetensors", "model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.shared_experts.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.shared_experts.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.0.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.0.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.0.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.0.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.0.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.1.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.1.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.1.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.1.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.1.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.2.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.2.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.2.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.2.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.2.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.3.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.3.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.3.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.3.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.3.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.4.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.4.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.4.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.4.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.4.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.5.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.5.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.5.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.5.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.5.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.6.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.6.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.6.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.6.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.6.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.7.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.7.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.7.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.7.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.7.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.8.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.8.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.8.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.8.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.8.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.9.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.9.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.9.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.9.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.9.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.10.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.10.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.10.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.10.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.10.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.11.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.11.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.11.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.11.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.11.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.12.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.12.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.12.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.12.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.12.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.13.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.13.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.13.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.13.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.13.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.14.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.14.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.14.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.14.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.14.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.15.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.15.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.15.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.15.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.15.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.16.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.16.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.16.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.16.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.16.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.17.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.17.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.17.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.17.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.17.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.18.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.18.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.18.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.18.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.18.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.19.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.19.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.19.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.19.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.19.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.20.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.20.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.20.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.20.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.20.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.21.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.21.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.21.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.21.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.21.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.22.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.22.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.22.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.22.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.22.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.23.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.23.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.23.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.23.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.23.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.24.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.24.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.24.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.24.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.24.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.25.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.25.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.25.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.25.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.25.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.26.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.26.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.26.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.26.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.26.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.27.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.27.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.27.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.27.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.27.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.28.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.28.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.28.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.28.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.28.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.29.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.29.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.29.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.29.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.29.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.30.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.30.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.30.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.30.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.30.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.31.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.31.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.31.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.31.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.31.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.32.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.32.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.32.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.32.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.32.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.33.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.33.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.33.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.33.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.33.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.34.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.34.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.34.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.34.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.34.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.35.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.35.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.35.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.35.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.35.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.36.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.36.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.36.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.36.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.36.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.37.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.37.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.37.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.37.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.37.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.38.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.38.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.38.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.38.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.38.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.39.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.39.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.39.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.39.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.39.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.40.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.40.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.40.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.40.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.40.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.41.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.41.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.41.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.41.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.41.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.42.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.42.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.42.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.42.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.42.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.43.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.43.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.43.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.43.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.43.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.44.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.44.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.44.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.44.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.44.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.45.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.45.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.45.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.45.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.45.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.46.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.46.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.46.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.46.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.46.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.47.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.47.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.47.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.47.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.47.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.48.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.48.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.48.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.48.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.48.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.49.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.49.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.49.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.49.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.49.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.50.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.50.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.50.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.50.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.50.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.51.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.51.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.51.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.51.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.51.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.52.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.52.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.52.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.52.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.52.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.53.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.53.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.53.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.53.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.53.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.54.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.54.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.54.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.54.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.54.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.55.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.55.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.55.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.55.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.55.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.56.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.56.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.56.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.56.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.56.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.57.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.57.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.57.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.57.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.57.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.58.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.58.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.58.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.58.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.58.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.59.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.59.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.59.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.59.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.59.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.60.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.60.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.60.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.60.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.60.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.61.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.61.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.61.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.61.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.61.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.62.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.62.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.62.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.62.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.62.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.63.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.63.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.63.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.63.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.63.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.64.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.64.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.64.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.64.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.64.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.65.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.65.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.65.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.65.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.65.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.66.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.66.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.66.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.66.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.66.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.67.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.67.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.67.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.67.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.67.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.68.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.68.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.68.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.68.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.68.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.69.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.69.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.69.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.69.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.69.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.70.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.70.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.70.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.70.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.70.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.71.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.71.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.71.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.71.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.71.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.72.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.72.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.72.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.72.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.72.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.73.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.73.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.73.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.73.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.73.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.74.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.74.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.74.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.74.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.74.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.75.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.75.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.75.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.75.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.75.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.76.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.76.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.76.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.76.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.76.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.77.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.77.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.77.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.77.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.77.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.78.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.78.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.78.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.78.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.78.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.79.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.79.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.79.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.79.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.79.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.80.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.80.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.80.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.80.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.80.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.81.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.81.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.81.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.81.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.81.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.82.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.82.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.82.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.82.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.82.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.83.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.83.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.83.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.83.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.83.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.84.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.84.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.84.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.84.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.84.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.85.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.85.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.85.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.85.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.85.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.86.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.86.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.86.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.86.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.86.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.87.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.87.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.87.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.87.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.87.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.88.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.88.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.88.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.88.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.88.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.89.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.89.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.89.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.89.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.89.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.90.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.90.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.90.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.90.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.90.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.91.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.91.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.91.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.91.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.91.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.92.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.92.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.92.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.92.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.92.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.93.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.93.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.93.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.93.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.93.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.94.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.94.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.94.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.94.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.94.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.95.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.95.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.95.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.95.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.95.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.96.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.96.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.96.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.96.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.96.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.97.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.97.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.97.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.97.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.97.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.98.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.98.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.98.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.98.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.98.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.99.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.99.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.99.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.99.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.99.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.100.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.100.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.100.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.100.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.100.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.101.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.101.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.101.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.101.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.101.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.102.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.102.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.102.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.102.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.102.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.103.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.103.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.103.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.103.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.103.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.104.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.104.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.104.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.104.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.104.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.105.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.105.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.105.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.105.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.105.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.106.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.106.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.106.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.106.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.106.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.107.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.107.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.107.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.107.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.107.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.108.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.108.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.108.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.108.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.108.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.109.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.109.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.109.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.109.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.109.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.110.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.110.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.110.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.110.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.110.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.111.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.111.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.111.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.111.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.111.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.112.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.112.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.112.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.112.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.112.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.113.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.113.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.113.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.113.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.113.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.114.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.114.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.114.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.114.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.114.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.115.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.115.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.115.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.115.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.115.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.116.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.116.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.116.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.116.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.116.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.117.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.117.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.117.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.117.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.117.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.118.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.118.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.118.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.118.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.118.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.119.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.119.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.119.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.119.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.119.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.120.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.120.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.120.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.120.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.120.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.121.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.121.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.121.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.121.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.121.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.122.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.122.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.122.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.122.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.122.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.123.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.123.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.123.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.123.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.123.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.124.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.124.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.124.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.124.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.124.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.125.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.125.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.125.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.125.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.125.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.126.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.126.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.126.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.126.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.126.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.127.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.127.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.127.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.127.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.127.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.128.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.128.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.128.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.128.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.128.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.128.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.129.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.129.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.129.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.129.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.129.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.129.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.130.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.130.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.130.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.130.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.130.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.130.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.131.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.131.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.131.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.131.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.131.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.131.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.132.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.132.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.132.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.132.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.132.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.132.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.133.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.133.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.133.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.133.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.133.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.133.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.134.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.134.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.134.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.134.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.134.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.134.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.135.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.135.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.135.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.135.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.135.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.135.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.136.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.136.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.136.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.136.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.136.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.136.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.137.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.137.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.137.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.137.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.137.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.137.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.138.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.138.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.138.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.138.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.138.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.138.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.139.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.139.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.139.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.139.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.139.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.139.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.140.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.140.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.140.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.140.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.140.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.140.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.141.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.141.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.141.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.141.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.141.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.141.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.142.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.142.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.142.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.142.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.142.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.142.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.143.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.143.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.143.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.143.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.143.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.143.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.144.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.144.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.144.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.144.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.144.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.144.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.145.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.145.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.145.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.145.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.145.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.145.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.146.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.146.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.146.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.146.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.146.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.146.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.147.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.147.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.147.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.147.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.147.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.147.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.148.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.148.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.148.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.148.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.148.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.148.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.149.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.149.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.149.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.149.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.149.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.149.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.150.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.150.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.150.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.150.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.150.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.150.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.151.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.151.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.151.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.151.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.151.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.151.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.152.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.152.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.152.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.152.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.152.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.152.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.153.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.153.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.153.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.153.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.153.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.153.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.154.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.154.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.154.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.154.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.154.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.154.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.155.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.155.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.155.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.155.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.155.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.155.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.156.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.156.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.156.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.156.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.156.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.156.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.157.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.157.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.157.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.157.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.157.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.157.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.158.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.158.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.158.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.158.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.158.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.158.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.159.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.159.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.159.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.159.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.159.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.159.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.160.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.160.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.160.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.160.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.160.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.160.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.161.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.161.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.161.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.161.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.161.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.161.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.162.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.162.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.162.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.162.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.162.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.162.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.163.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.163.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.163.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.163.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.163.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.163.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.164.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.164.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.164.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.164.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.164.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.164.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.165.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.165.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.165.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.165.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.165.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.165.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.166.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.166.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.166.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.166.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.166.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.166.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.167.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.167.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.167.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.167.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.167.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.167.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.168.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.168.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.168.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.168.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.168.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.168.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.169.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.169.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.169.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.169.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.169.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.169.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.170.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.170.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.170.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.170.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.170.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.170.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.171.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.171.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.171.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.171.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.171.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.171.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.172.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.172.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.172.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.172.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.172.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.172.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.173.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.173.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.173.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.173.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.173.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.173.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.174.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.174.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.174.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.174.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.174.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.174.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.175.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.175.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.175.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.175.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.175.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.175.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.176.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.176.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.176.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.176.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.176.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.176.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.177.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.177.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.177.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.177.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.177.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.177.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.178.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.178.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.178.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.178.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.178.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.178.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.179.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.179.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.179.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.179.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.179.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.179.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.180.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.180.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.180.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.180.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.180.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.180.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.181.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.181.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.181.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.181.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.181.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.181.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.182.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.182.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.182.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.182.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.182.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.182.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.183.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.183.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.183.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.183.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.183.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.183.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.184.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.184.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.184.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.184.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.184.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.184.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.185.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.185.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.185.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.185.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.185.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.185.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.186.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.186.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.186.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.186.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.186.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.186.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.187.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.187.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.187.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.187.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.187.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.187.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.188.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.188.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.188.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.188.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.188.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.188.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.189.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.189.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.189.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.189.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.189.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.189.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.190.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.190.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.190.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.190.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.190.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.190.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.191.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.191.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.191.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.191.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.191.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.191.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.192.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.192.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.192.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.192.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.192.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.192.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.193.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.193.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.193.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.193.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.193.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.193.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.194.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.194.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.194.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.194.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.194.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.194.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.195.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.195.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.195.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.195.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.195.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.195.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.196.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.196.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.196.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.196.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.196.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.196.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.197.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.197.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.197.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.197.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.197.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.197.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.198.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.198.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.198.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.198.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.198.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.198.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.199.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.199.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.199.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.199.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.199.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.199.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.200.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.200.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.200.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.200.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.200.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.200.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.201.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.201.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.201.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.201.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.201.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.201.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.202.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.202.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.202.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.202.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.202.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.202.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.203.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.203.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.203.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.203.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.203.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.203.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.204.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.204.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.204.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.204.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.204.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.204.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.205.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.205.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.205.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.205.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.205.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.205.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.206.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.206.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.206.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.206.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.206.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.206.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.207.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.207.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.207.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.207.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.207.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.207.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.208.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.208.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.208.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.208.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.208.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.208.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.209.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.209.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.209.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.209.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.209.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.209.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.210.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.210.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.210.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.210.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.210.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.210.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.211.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.211.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.211.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.211.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.211.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.211.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.212.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.212.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.212.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.212.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.212.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.212.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.213.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.213.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.213.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.213.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.213.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.213.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.214.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.214.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.214.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.214.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.214.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.214.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.215.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.215.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.215.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.215.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.215.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.215.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.216.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.216.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.216.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.216.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.216.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.216.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.217.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.217.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.217.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.217.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.217.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.217.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.218.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.218.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.218.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.218.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.218.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.218.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.219.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.219.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.219.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.219.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.219.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.219.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.220.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.220.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.220.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.220.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.220.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.220.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.221.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.221.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.221.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.221.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.221.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.221.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.222.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.222.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.222.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.222.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.222.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.222.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.223.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.223.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.223.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.223.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.223.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.223.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.224.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.224.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.224.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.224.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.224.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.224.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.225.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.225.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.225.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.225.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.225.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.225.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.226.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.226.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.226.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.226.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.226.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.226.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.227.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.227.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.227.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.227.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.227.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.227.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.228.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.228.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.228.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.228.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.228.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.228.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.229.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.229.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.229.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.229.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.229.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.229.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.230.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.230.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.230.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.230.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.230.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.230.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.231.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.231.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.231.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.231.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.231.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.231.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.232.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.232.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.232.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.232.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.232.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.232.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.233.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.233.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.233.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.233.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.233.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.233.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.234.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.234.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.234.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.234.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.234.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.234.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.235.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.235.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.235.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.235.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.235.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.235.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.236.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.236.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.236.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.236.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.236.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.236.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.237.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.237.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.237.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.237.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.237.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.237.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.238.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.238.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.238.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.238.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.238.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.238.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.239.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.239.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.239.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.239.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.239.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.239.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.240.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.240.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.240.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.240.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.240.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.240.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.241.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.241.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.241.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.241.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.241.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.241.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.242.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.242.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.242.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.242.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.242.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.242.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.243.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.243.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.243.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.243.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.243.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.243.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.244.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.244.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.244.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.244.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.244.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.244.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.245.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.245.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.245.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.245.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.245.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.245.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.246.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.246.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.246.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.246.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.246.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.246.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.247.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.247.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.247.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.247.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.247.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.247.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.248.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.248.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.248.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.248.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.248.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.248.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.249.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.249.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.249.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.249.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.249.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.249.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.250.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.250.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.250.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.250.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.250.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.250.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.251.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.251.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.251.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.251.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.251.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.251.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.252.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.252.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.252.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.252.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.252.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.252.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.253.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.253.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.253.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.253.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.253.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.253.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.254.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.254.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.254.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.254.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.254.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.254.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.255.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.255.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.255.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.255.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.255.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.255.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.input_layernorm.weight": "model-00029-of-000163.safetensors", "model.layers.12.post_attention_layernorm.weight": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.q_a_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.self_attn.q_a_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.q_a_layernorm.weight": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.q_b_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.self_attn.q_b_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.kv_a_proj_with_mqa.weight": "model-00029-of-000163.safetensors", - "model.layers.13.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.kv_a_layernorm.weight": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.kv_b_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.self_attn.kv_b_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.o_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.self_attn.o_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.gate.weight": "model-00029-of-000163.safetensors", "model.layers.13.mlp.gate.e_score_correction_bias": "model-00029-of-000163.safetensors", "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.shared_experts.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.shared_experts.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.shared_experts.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.0.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.0.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.0.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.0.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.0.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.1.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.1.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.1.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.1.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.1.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.2.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.2.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.2.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.2.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.2.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.3.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.3.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.3.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.3.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.3.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.4.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.4.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.4.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.4.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.4.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.5.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.5.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.5.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.5.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.5.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.6.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.6.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.6.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.6.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.6.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.7.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.7.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.7.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.7.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.7.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.8.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.8.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.8.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.8.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.8.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.9.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.9.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.9.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.9.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.9.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.10.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.10.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.10.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.10.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.10.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.11.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.11.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.11.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.11.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.11.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.12.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.12.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.12.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.12.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.12.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.13.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.13.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.13.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.13.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.13.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.14.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.14.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.14.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.14.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.14.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.15.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.15.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.15.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.15.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.15.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.16.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.16.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.16.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.16.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.16.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.17.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.17.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.17.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.17.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.17.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.18.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.18.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.18.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.18.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.18.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.19.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.19.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.19.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.19.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.19.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.20.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.20.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.20.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.20.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.20.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.21.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.21.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.21.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.21.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.21.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.22.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.22.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.22.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.22.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.22.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.23.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.23.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.23.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.23.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.23.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.24.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.24.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.24.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.24.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.24.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.25.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.25.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.25.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.25.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.25.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.26.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.26.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.26.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.26.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.26.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.27.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.27.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.27.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.27.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.27.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.28.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.28.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.28.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.28.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.28.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.29.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.29.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.29.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.29.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.29.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.30.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.30.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.30.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.30.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.30.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.31.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.31.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.31.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.31.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.31.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.31.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.32.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.32.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.32.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.32.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.32.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.33.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.33.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.33.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.33.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.33.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.34.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.34.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.34.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.34.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.34.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.35.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.35.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.35.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.35.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.35.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.36.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.36.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.36.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.36.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.36.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.37.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.37.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.37.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.37.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.37.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.38.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.38.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.38.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.38.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.38.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.39.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.39.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.39.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.39.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.39.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.40.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.40.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.40.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.40.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.40.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.41.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.41.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.41.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.41.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.41.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.42.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.42.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.42.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.42.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.42.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.43.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.43.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.43.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.43.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.43.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.44.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.44.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.44.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.44.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.44.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.45.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.45.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.45.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.45.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.45.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.46.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.46.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.46.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.46.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.46.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.47.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.47.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.47.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.47.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.47.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.48.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.48.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.48.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.48.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.48.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.49.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.49.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.49.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.49.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.49.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.50.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.50.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.50.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.50.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.50.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.51.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.51.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.51.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.51.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.51.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.52.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.52.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.52.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.52.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.52.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.53.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.53.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.53.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.53.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.53.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.54.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.54.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.54.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.54.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.54.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.55.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.55.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.55.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.55.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.55.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.56.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.56.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.56.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.56.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.56.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.57.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.57.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.57.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.57.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.57.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.58.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.58.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.58.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.58.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.58.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.59.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.59.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.59.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.59.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.59.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.60.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.60.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.60.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.60.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.60.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.61.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.61.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.61.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.61.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.61.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.62.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.62.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.62.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.62.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.62.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.63.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.63.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.63.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.63.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.63.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.64.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.64.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.64.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.64.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.64.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.65.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.65.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.65.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.65.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.65.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.66.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.66.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.66.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.66.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.66.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.67.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.67.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.67.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.67.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.67.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.68.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.68.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.68.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.68.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.68.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.69.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.69.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.69.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.69.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.69.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.70.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.70.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.70.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.70.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.70.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.71.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.71.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.71.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.71.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.71.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.72.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.72.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.72.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.72.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.72.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.73.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.73.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.73.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.73.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.73.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.74.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.74.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.74.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.74.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.74.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.75.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.75.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.75.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.75.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.75.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.76.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.76.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.76.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.76.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.76.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.77.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.77.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.77.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.77.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.77.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.78.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.78.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.78.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.78.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.78.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.79.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.79.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.79.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.79.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.79.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.80.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.80.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.80.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.80.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.80.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.81.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.81.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.81.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.81.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.81.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.82.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.82.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.82.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.82.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.82.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.83.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.83.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.83.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.83.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.83.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.84.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.84.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.84.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.84.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.84.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.85.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.85.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.85.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.85.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.85.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.86.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.86.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.86.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.86.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.86.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.87.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.87.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.87.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.87.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.87.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.88.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.88.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.88.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.88.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.88.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.89.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.89.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.89.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.89.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.89.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.90.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.90.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.90.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.90.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.90.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.91.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.91.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.91.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.91.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.91.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.92.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.92.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.92.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.92.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.92.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.93.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.93.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.93.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.93.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.93.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.94.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.94.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.94.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.94.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.94.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.95.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.95.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.95.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.95.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.95.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.96.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.96.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.96.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.96.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.96.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.97.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.97.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.97.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.97.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.97.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.98.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.98.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.98.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.98.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.98.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.99.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.99.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.99.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.99.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.99.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.100.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.100.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.100.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.100.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.100.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.101.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.101.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.101.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.101.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.101.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.102.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.102.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.102.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.102.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.102.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.103.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.103.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.103.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.103.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.103.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.104.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.104.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.104.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.104.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.104.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.105.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.105.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.105.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.105.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.105.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.106.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.106.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.106.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.106.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.106.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.107.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.107.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.107.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.107.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.107.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.108.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.108.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.108.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.108.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.108.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.109.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.109.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.109.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.109.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.109.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.110.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.110.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.110.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.110.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.110.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.111.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.111.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.111.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.111.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.111.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.112.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.112.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.112.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.112.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.112.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.113.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.113.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.113.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.113.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.113.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.113.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.114.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.114.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.114.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.114.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.114.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.115.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.115.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.115.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.115.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.115.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.116.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.116.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.116.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.116.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.116.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.117.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.117.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.117.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.117.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.117.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.118.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.118.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.118.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.118.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.118.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.119.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.119.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.119.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.119.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.119.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.120.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.120.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.120.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.120.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.120.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.121.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.121.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.121.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.121.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.121.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.122.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.122.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.122.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.122.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.122.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.123.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.123.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.123.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.123.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.123.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.124.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.124.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.124.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.124.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.124.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.125.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.125.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.125.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.125.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.125.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.126.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.126.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.126.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.126.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.126.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.127.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.127.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.127.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.127.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.127.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.128.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.128.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.128.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.128.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.128.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.128.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.129.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.129.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.129.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.129.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.129.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.129.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.130.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.130.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.130.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.130.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.130.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.130.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.131.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.131.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.131.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.131.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.131.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.131.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.132.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.132.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.132.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.132.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.132.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.132.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.133.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.133.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.133.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.133.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.133.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.133.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.134.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.134.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.134.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.134.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.134.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.134.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.135.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.135.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.135.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.135.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.135.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.135.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.136.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.136.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.136.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.136.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.136.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.136.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.137.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.137.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.137.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.137.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.137.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.137.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.138.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.138.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.138.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.138.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.138.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.138.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.139.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.139.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.139.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.139.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.139.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.139.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.140.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.140.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.140.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.140.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.140.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.140.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.141.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.141.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.141.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.141.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.141.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.141.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.142.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.142.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.142.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.142.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.142.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.142.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.143.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.143.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.143.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.143.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.143.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.143.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.144.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.144.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.144.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.144.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.144.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.144.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.145.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.145.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.145.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.145.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.145.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.145.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.146.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.146.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.146.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.146.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.146.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.146.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.147.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.147.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.147.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.147.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.147.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.147.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.148.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.148.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.148.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.148.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.148.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.148.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.149.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.149.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.149.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.149.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.149.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.149.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.150.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.150.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.150.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.150.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.150.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.150.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.151.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.151.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.151.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.151.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.151.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.151.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.152.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.152.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.152.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.152.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.152.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.152.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.153.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.153.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.153.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.153.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.153.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.153.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.154.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.154.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.154.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.154.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.154.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.154.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.155.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.155.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.155.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.155.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.155.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.155.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.156.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.156.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.156.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.156.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.156.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.156.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.157.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.157.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.157.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.157.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.157.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.157.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.158.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.158.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.158.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.158.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.158.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.158.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.159.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.159.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.159.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.159.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.159.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.159.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.160.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.160.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.160.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.160.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.160.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.160.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.161.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.161.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.161.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.161.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.161.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.161.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.162.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.162.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.162.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.162.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.162.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.162.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.163.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.163.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.163.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.163.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.163.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.163.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.164.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.164.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.164.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.164.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.164.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.164.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.165.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.165.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.165.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.165.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.165.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.165.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.166.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.166.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.166.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.166.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.166.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.166.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.167.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.167.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.167.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.167.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.167.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.167.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.168.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.168.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.168.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.168.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.168.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.168.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.169.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.169.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.169.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.169.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.169.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.169.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.170.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.170.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.170.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.170.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.170.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.170.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.171.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.171.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.171.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.171.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.171.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.171.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.172.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.172.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.172.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.172.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.172.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.172.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.173.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.173.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.173.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.173.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.173.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.173.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.174.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.174.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.174.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.174.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.174.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.174.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.175.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.175.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.175.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.175.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.175.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.175.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.176.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.176.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.176.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.176.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.176.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.176.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.177.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.177.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.177.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.177.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.177.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.177.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.178.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.178.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.178.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.178.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.178.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.178.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.179.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.179.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.179.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.179.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.179.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.179.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.180.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.180.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.180.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.180.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.180.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.180.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.181.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.181.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.181.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.181.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.181.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.181.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.182.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.182.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.182.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.182.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.182.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.182.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.183.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.183.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.183.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.183.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.183.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.183.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.184.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.184.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.184.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.184.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.184.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.184.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.185.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.185.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.185.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.185.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.185.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.185.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.186.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.186.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.186.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.186.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.186.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.186.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.187.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.187.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.187.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.187.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.187.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.187.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.188.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.188.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.188.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.188.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.188.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.188.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.189.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.189.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.189.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.189.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.189.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.189.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.190.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.190.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.190.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.190.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.190.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.190.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.191.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.191.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.191.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.191.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.191.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.191.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.192.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.192.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.192.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.192.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.192.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.192.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.193.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.193.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.193.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.193.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.193.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.193.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.194.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.194.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.194.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.194.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.194.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.194.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.195.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.195.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.195.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.195.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.195.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.195.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.196.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.196.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.196.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.196.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.196.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.196.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.197.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.197.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.197.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.197.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.197.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.197.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.198.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.198.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.198.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.198.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.198.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.198.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.199.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.199.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.199.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.199.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.199.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.199.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.200.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.200.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.200.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.200.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.200.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.200.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.201.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.201.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.201.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.201.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.201.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.201.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.202.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.202.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.202.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.202.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.202.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.202.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.203.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.203.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.203.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.203.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.203.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.203.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.204.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.204.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.204.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.204.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.204.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.204.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.205.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.205.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.205.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.205.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.205.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.205.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.206.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.206.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.206.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.206.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.206.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.206.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.207.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.207.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.207.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.207.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.207.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.207.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.208.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.208.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.208.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.208.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.208.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.208.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.209.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.209.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.209.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.209.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.209.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.209.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.210.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.210.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.210.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.210.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.210.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.210.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.211.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.211.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.211.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.211.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.211.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.211.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.212.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.212.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.212.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.212.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.212.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.212.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.213.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.213.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.213.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.213.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.213.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.213.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.214.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.214.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.214.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.214.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.214.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.214.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.215.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.215.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.215.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.215.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.215.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.215.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.216.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.216.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.216.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.216.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.216.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.216.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.217.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.217.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.217.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.217.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.217.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.217.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.218.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.218.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.218.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.218.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.218.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.218.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.219.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.219.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.219.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.219.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.219.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.219.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.220.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.220.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.220.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.220.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.220.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.220.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.221.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.221.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.221.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.221.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.221.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.221.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.222.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.222.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.222.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.222.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.222.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.222.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.223.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.223.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.223.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.223.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.223.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.223.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.224.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.224.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.224.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.224.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.224.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.224.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.225.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.225.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.225.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.225.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.225.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.225.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.226.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.226.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.226.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.226.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.226.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.226.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.227.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.227.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.227.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.227.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.227.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.227.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.228.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.228.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.228.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.228.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.228.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.228.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.229.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.229.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.229.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.229.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.229.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.229.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.230.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.230.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.230.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.230.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.230.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.230.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.231.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.231.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.231.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.231.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.231.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.231.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.232.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.232.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.232.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.232.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.232.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.232.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.233.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.233.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.233.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.233.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.233.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.233.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.234.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.234.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.234.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.234.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.234.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.234.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.235.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.235.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.235.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.235.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.235.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.235.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.236.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.236.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.236.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.236.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.236.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.236.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.237.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.237.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.237.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.237.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.237.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.237.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.238.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.238.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.238.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.238.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.238.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.238.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.239.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.239.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.239.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.239.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.239.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.239.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.240.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.240.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.240.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.240.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.240.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.240.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.241.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.241.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.241.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.241.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.241.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.241.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.242.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.242.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.242.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.242.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.242.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.242.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.243.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.243.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.243.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.243.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.243.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.243.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.244.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.244.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.244.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.244.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.244.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.244.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.245.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.245.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.245.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.245.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.245.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.245.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.246.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.246.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.246.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.246.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.246.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.246.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.247.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.247.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.247.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.247.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.247.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.247.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.248.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.248.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.248.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.248.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.248.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.248.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.249.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.249.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.249.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.249.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.249.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.249.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.250.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.250.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.250.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.250.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.250.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.250.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.251.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.251.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.251.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.251.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.251.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.251.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.252.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.252.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.252.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.252.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.252.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.252.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.253.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.253.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.253.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.253.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.253.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.253.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.254.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.254.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.254.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.254.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.254.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.254.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.255.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.255.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.255.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.255.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.255.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.255.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.input_layernorm.weight": "model-00031-of-000163.safetensors", "model.layers.13.post_attention_layernorm.weight": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.q_a_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.self_attn.q_a_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.q_a_layernorm.weight": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.q_b_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.self_attn.q_b_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.kv_a_proj_with_mqa.weight": "model-00031-of-000163.safetensors", - "model.layers.14.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.kv_a_layernorm.weight": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.kv_b_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.self_attn.kv_b_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.o_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.self_attn.o_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.gate.weight": "model-00031-of-000163.safetensors", "model.layers.14.mlp.gate.e_score_correction_bias": "model-00031-of-000163.safetensors", "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.shared_experts.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.shared_experts.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.shared_experts.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.0.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.0.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.0.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.0.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.0.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.1.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.1.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.1.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.1.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.1.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.2.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.2.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.2.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.2.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.2.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.3.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.3.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.3.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.3.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.3.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.4.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.4.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.4.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.4.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.4.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.5.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.5.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.5.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.5.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.5.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.6.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.6.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.6.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.6.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.6.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.7.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.7.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.7.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.7.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.7.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.8.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.8.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.8.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.8.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.8.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.9.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.9.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.9.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.9.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.9.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.10.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.10.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.10.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.10.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.10.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.11.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.11.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.11.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.11.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.11.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.12.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.12.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.12.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.12.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.12.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.13.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.13.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.13.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.13.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.13.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.14.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.14.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.14.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.14.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.14.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.15.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.15.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.15.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.15.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.15.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.16.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.16.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.16.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.16.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.16.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.17.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.17.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.17.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.17.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.17.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.18.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.18.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.18.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.18.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.18.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.19.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.19.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.19.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.19.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.19.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.20.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.20.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.20.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.20.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.20.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.21.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.21.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.21.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.21.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.21.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.22.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.22.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.22.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.22.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.22.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.23.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.23.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.23.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.23.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.23.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.24.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.24.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.24.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.24.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.24.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.25.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.25.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.25.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.25.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.25.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.26.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.26.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.26.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.26.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.26.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.27.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.27.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.27.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.27.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.27.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.28.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.28.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.28.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.28.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.28.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.29.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.29.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.29.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.29.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.29.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.30.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.30.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.30.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.30.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.30.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.31.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.31.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.31.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.31.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.31.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.32.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.32.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.32.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.32.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.32.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.33.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.33.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.33.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.33.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.33.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.34.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.34.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.34.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.34.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.34.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.35.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.35.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.35.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.35.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.35.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.36.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.36.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.36.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.36.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.36.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.37.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.37.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.37.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.37.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.37.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.38.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.38.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.38.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.38.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.38.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.39.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.39.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.39.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.39.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.39.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.40.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.40.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.40.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.40.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.40.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.41.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.41.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.41.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.41.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.41.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.42.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.42.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.42.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.42.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.42.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.43.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.43.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.43.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.43.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.43.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.44.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.44.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.44.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.44.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.44.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.45.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.45.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.45.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.45.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.45.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.46.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.46.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.46.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.46.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.46.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.47.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.47.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.47.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.47.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.47.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.48.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.48.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.48.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.48.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.48.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.49.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.49.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.49.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.49.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.49.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.50.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.50.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.50.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.50.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.50.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.51.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.51.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.51.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.51.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.51.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.52.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.52.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.52.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.52.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.52.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.52.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.53.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.53.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.53.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.53.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.53.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.54.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.54.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.54.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.54.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.54.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.55.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.55.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.55.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.55.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.55.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.56.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.56.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.56.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.56.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.56.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.57.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.57.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.57.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.57.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.57.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.58.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.58.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.58.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.58.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.58.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.59.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.59.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.59.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.59.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.59.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.60.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.60.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.60.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.60.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.60.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.61.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.61.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.61.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.61.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.61.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.62.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.62.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.62.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.62.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.62.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.63.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.63.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.63.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.63.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.63.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.64.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.64.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.64.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.64.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.64.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.65.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.65.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.65.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.65.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.65.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.66.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.66.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.66.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.66.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.66.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.66.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.67.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.67.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.67.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.67.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.67.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.68.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.68.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.68.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.68.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.68.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.69.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.69.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.69.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.69.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.69.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.70.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.70.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.70.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.70.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.70.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.71.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.71.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.71.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.71.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.71.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.72.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.72.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.72.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.72.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.72.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.73.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.73.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.73.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.73.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.73.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.74.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.74.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.74.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.74.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.74.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.75.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.75.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.75.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.75.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.75.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.76.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.76.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.76.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.76.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.76.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.77.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.77.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.77.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.77.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.77.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.78.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.78.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.78.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.78.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.78.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.79.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.79.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.79.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.79.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.79.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.80.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.80.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.80.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.80.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.80.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.81.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.81.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.81.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.81.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.81.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.82.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.82.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.82.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.82.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.82.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.83.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.83.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.83.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.83.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.83.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.84.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.84.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.84.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.84.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.84.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.85.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.85.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.85.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.85.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.85.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.85.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.86.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.86.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.86.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.86.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.86.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.87.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.87.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.87.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.87.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.87.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.88.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.88.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.88.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.88.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.88.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.89.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.89.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.89.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.89.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.89.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.90.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.90.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.90.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.90.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.90.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.91.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.91.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.91.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.91.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.91.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.92.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.92.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.92.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.92.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.92.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.93.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.93.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.93.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.93.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.93.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.94.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.94.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.94.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.94.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.94.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.95.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.95.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.95.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.95.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.95.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.96.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.96.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.96.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.96.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.96.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.97.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.97.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.97.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.97.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.97.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.98.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.98.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.98.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.98.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.98.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.99.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.99.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.99.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.99.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.99.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.100.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.100.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.100.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.100.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.100.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.101.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.101.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.101.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.101.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.101.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.102.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.102.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.102.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.102.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.102.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.103.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.103.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.103.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.103.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.103.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.104.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.104.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.104.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.104.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.104.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.105.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.105.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.105.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.105.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.105.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.106.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.106.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.106.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.106.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.106.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.107.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.107.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.107.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.107.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.107.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.108.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.108.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.108.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.108.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.108.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.109.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.109.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.109.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.109.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.109.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.110.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.110.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.110.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.110.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.110.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.111.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.111.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.111.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.111.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.111.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.112.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.112.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.112.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.112.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.112.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.113.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.113.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.113.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.113.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.113.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.114.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.114.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.114.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.114.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.114.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.115.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.115.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.115.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.115.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.115.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.116.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.116.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.116.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.116.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.116.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.117.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.117.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.117.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.117.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.117.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.118.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.118.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.118.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.118.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.118.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.119.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.119.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.119.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.119.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.119.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.120.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.120.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.120.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.120.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.120.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.121.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.121.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.121.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.121.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.121.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.122.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.122.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.122.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.122.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.122.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.122.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.123.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.123.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.123.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.123.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.123.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.124.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.124.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.124.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.124.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.124.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.125.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.125.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.125.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.125.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.125.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.126.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.126.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.126.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.126.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.126.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.127.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.127.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.127.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.127.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.127.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.128.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.128.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.128.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.128.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.128.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.128.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.129.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.129.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.129.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.129.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.129.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.129.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.130.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.130.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.130.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.130.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.130.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.130.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.131.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.131.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.131.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.131.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.131.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.131.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.132.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.132.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.132.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.132.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.132.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.132.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.133.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.133.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.133.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.133.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.133.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.133.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.134.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.134.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.134.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.134.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.134.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.134.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.135.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.135.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.135.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.135.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.135.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.135.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.136.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.136.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.136.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.136.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.136.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.136.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.137.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.137.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.137.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.137.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.137.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.137.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.138.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.138.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.138.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.138.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.138.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.138.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.139.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.139.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.139.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.139.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.139.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.139.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.140.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.140.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.140.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.140.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.140.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.140.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.141.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.141.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.141.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.141.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.141.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.141.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.142.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.142.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.142.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.142.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.142.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.142.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.143.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.143.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.143.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.143.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.143.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.143.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.144.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.144.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.144.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.144.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.144.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.144.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.145.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.145.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.145.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.145.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.145.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.145.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.146.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.146.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.146.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.146.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.146.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.146.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.147.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.147.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.147.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.147.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.147.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.147.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.148.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.148.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.148.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.148.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.148.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.148.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.149.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.149.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.149.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.149.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.149.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.149.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.150.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.150.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.150.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.150.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.150.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.150.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.151.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.151.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.151.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.151.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.151.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.151.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.152.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.152.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.152.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.152.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.152.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.152.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.153.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.153.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.153.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.153.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.153.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.153.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.154.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.154.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.154.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.154.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.154.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.154.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.155.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.155.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.155.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.155.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.155.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.155.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.156.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.156.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.156.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.156.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.156.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.156.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.157.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.157.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.157.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.157.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.157.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.157.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.158.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.158.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.158.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.158.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.158.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.158.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.159.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.159.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.159.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.159.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.159.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.159.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.160.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.160.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.160.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.160.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.160.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.160.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.161.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.161.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.161.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.161.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.161.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.161.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.162.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.162.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.162.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.162.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.162.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.162.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.163.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.163.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.163.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.163.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.163.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.163.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.164.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.164.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.164.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.164.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.164.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.164.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.165.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.165.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.165.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.165.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.165.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.165.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.166.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.166.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.166.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.166.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.166.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.166.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.167.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.167.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.167.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.167.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.167.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.167.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.168.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.168.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.168.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.168.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.168.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.168.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.169.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.169.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.169.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.169.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.169.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.169.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.170.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.170.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.170.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.170.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.170.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.170.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.171.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.171.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.171.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.171.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.171.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.171.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.172.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.172.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.172.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.172.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.172.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.172.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.173.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.173.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.173.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.173.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.173.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.173.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.174.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.174.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.174.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.174.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.174.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.174.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.175.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.175.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.175.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.175.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.175.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.175.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.176.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.176.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.176.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.176.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.176.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.176.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.177.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.177.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.177.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.177.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.177.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.177.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.178.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.178.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.178.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.178.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.178.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.178.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.179.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.179.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.179.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.179.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.179.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.179.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.180.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.180.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.180.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.180.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.180.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.180.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.181.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.181.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.181.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.181.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.181.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.181.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.182.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.182.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.182.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.182.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.182.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.182.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.183.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.183.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.183.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.183.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.183.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.183.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.184.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.184.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.184.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.184.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.184.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.184.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.185.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.185.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.185.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.185.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.185.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.185.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.186.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.186.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.186.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.186.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.186.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.186.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.187.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.187.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.187.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.187.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.187.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.187.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.188.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.188.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.188.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.188.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.188.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.188.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.189.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.189.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.189.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.189.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.189.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.189.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.190.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.190.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.190.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.190.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.190.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.190.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.191.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.191.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.191.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.191.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.191.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.191.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.192.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.192.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.192.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.192.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.192.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.192.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.193.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.193.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.193.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.193.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.193.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.193.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.194.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.194.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.194.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.194.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.194.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.194.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.195.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.195.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.195.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.195.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.195.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.195.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.196.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.196.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.196.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.196.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.196.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.196.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.197.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.197.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.197.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.197.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.197.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.197.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.198.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.198.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.198.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.198.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.198.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.198.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.199.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.199.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.199.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.199.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.199.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.199.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.200.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.200.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.200.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.200.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.200.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.200.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.201.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.201.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.201.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.201.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.201.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.201.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.202.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.202.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.202.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.202.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.202.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.202.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.203.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.203.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.203.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.203.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.203.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.203.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.204.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.204.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.204.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.204.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.204.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.204.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.205.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.205.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.205.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.205.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.205.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.205.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.206.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.206.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.206.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.206.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.206.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.206.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.207.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.207.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.207.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.207.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.207.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.207.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.208.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.208.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.208.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.208.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.208.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.208.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.209.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.209.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.209.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.209.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.209.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.209.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.210.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.210.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.210.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.210.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.210.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.210.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.211.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.211.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.211.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.211.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.211.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.211.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.212.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.212.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.212.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.212.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.212.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.212.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.213.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.213.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.213.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.213.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.213.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.213.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.214.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.214.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.214.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.214.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.214.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.214.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.215.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.215.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.215.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.215.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.215.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.215.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.216.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.216.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.216.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.216.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.216.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.216.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.217.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.217.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.217.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.217.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.217.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.217.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.218.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.218.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.218.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.218.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.218.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.218.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.219.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.219.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.219.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.219.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.219.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.219.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.220.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.220.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.220.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.220.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.220.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.220.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.221.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.221.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.221.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.221.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.221.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.221.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.222.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.222.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.222.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.222.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.222.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.222.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.223.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.223.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.223.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.223.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.223.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.223.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.224.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.224.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.224.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.224.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.224.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.224.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.225.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.225.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.225.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.225.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.225.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.225.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.226.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.226.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.226.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.226.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.226.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.226.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.227.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.227.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.227.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.227.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.227.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.227.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.228.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.228.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.228.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.228.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.228.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.228.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.229.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.229.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.229.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.229.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.229.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.229.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.230.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.230.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.230.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.230.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.230.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.230.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.231.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.231.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.231.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.231.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.231.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.231.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.232.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.232.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.232.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.232.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.232.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.232.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.233.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.233.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.233.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.233.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.233.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.233.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.234.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.234.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.234.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.234.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.234.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.234.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.235.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.235.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.235.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.235.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.235.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.235.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.236.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.236.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.236.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.236.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.236.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.236.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.237.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.237.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.237.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.237.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.237.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.237.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.238.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.238.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.238.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.238.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.238.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.238.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.239.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.239.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.239.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.239.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.239.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.239.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.240.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.240.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.240.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.240.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.240.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.240.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.241.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.241.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.241.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.241.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.241.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.241.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.242.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.242.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.242.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.242.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.242.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.242.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.243.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.243.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.243.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.243.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.243.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.243.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.244.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.244.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.244.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.244.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.244.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.244.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.245.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.245.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.245.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.245.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.245.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.245.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.246.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.246.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.246.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.246.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.246.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.246.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.247.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.247.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.247.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.247.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.247.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.247.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.248.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.248.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.248.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.248.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.248.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.248.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.249.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.249.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.249.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.249.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.249.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.249.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.250.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.250.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.250.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.250.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.250.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.250.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.251.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.251.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.251.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.251.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.251.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.251.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.252.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.252.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.252.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.252.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.252.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.252.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.253.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.253.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.253.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.253.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.253.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.253.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.254.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.254.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.254.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.254.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.254.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.254.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.255.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.255.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.255.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.255.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.255.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.255.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.input_layernorm.weight": "model-00034-of-000163.safetensors", "model.layers.14.post_attention_layernorm.weight": "model-00034-of-000163.safetensors", "model.layers.15.self_attn.q_a_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.self_attn.q_a_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.self_attn.q_a_layernorm.weight": "model-00035-of-000163.safetensors", "model.layers.15.self_attn.q_b_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.self_attn.q_b_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.self_attn.kv_a_proj_with_mqa.weight": "model-00035-of-000163.safetensors", - "model.layers.15.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.self_attn.kv_a_layernorm.weight": "model-00035-of-000163.safetensors", "model.layers.15.self_attn.kv_b_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.self_attn.kv_b_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.self_attn.o_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.self_attn.o_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.gate.weight": "model-00035-of-000163.safetensors", "model.layers.15.mlp.gate.e_score_correction_bias": "model-00035-of-000163.safetensors", "model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.shared_experts.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.shared_experts.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.shared_experts.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.0.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.0.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.0.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.0.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.0.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.1.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.1.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.1.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.1.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.1.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.2.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.2.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.2.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.2.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.2.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.3.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.3.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.3.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.3.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.3.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.4.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.4.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.4.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.4.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.4.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.5.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.5.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.5.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.5.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.5.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.6.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.6.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.6.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.6.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.6.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.7.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.7.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.7.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.7.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.7.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.8.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.8.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.8.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.8.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.8.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.9.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.9.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.9.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.9.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.9.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.10.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.10.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.10.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.10.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.10.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.11.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.11.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.11.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.11.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.11.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.12.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.12.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.12.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.12.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.12.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.12.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.13.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.13.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.13.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.13.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.13.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.14.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.14.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.14.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.14.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.14.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.15.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.15.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.15.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.15.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.15.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.16.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.16.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.16.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.16.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.16.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.17.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.17.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.17.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.17.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.17.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.18.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.18.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.18.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.18.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.18.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.19.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.19.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.19.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.19.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.19.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.20.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.20.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.20.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.20.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.20.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.21.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.21.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.21.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.21.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.21.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.22.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.22.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.22.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.22.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.22.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.23.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.23.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.23.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.23.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.23.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.24.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.24.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.24.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.24.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.24.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.25.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.25.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.25.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.25.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.25.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.26.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.26.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.26.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.26.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.26.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.27.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.27.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.27.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.27.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.27.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.28.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.28.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.28.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.28.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.28.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.29.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.29.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.29.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.29.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.29.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.30.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.30.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.30.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.30.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.30.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.31.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.31.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.31.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.31.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.31.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.32.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.32.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.32.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.32.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.32.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.33.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.33.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.33.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.33.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.33.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.34.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.34.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.34.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.34.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.34.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.35.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.35.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.35.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.35.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.35.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.36.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.36.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.36.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.36.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.36.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.37.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.37.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.37.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.37.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.37.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.38.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.38.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.38.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.38.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.38.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.39.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.39.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.39.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.39.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.39.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.40.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.40.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.40.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.40.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.40.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.41.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.41.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.41.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.41.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.41.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.42.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.42.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.42.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.42.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.42.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.43.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.43.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.43.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.43.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.43.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.44.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.44.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.44.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.44.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.44.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.45.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.45.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.45.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.45.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.45.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.46.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.46.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.46.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.46.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.46.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.47.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.47.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.47.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.47.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.47.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.48.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.48.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.48.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.48.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.48.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.49.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.49.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.49.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.49.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.49.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.50.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.50.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.50.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.50.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.50.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.51.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.51.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.51.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.51.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.51.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.52.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.52.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.52.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.52.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.52.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.53.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.53.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.53.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.53.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.53.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.54.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.54.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.54.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.54.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.54.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.55.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.55.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.55.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.55.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.55.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.56.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.56.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.56.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.56.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.56.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.57.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.57.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.57.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.57.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.57.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.58.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.58.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.58.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.58.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.58.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.59.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.59.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.59.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.59.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.59.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.60.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.60.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.60.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.60.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.60.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.61.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.61.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.61.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.61.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.61.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.62.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.62.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.62.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.62.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.62.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.63.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.63.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.63.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.63.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.63.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.64.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.64.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.64.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.64.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.64.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.65.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.65.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.65.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.65.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.65.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.66.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.66.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.66.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.66.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.66.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.67.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.67.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.67.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.67.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.67.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.68.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.68.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.68.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.68.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.68.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.69.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.69.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.69.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.69.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.69.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.70.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.70.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.70.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.70.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.70.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.71.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.71.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.71.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.71.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.71.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.72.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.72.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.72.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.72.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.72.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.73.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.73.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.73.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.73.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.73.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.74.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.74.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.74.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.74.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.74.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.75.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.75.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.75.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.75.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.75.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.76.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.76.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.76.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.76.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.76.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.77.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.77.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.77.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.77.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.77.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.78.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.78.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.78.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.78.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.78.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.79.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.79.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.79.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.79.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.79.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.80.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.80.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.80.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.80.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.80.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.81.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.81.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.81.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.81.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.81.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.82.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.82.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.82.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.82.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.82.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.83.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.83.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.83.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.83.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.83.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.84.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.84.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.84.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.84.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.84.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.85.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.85.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.85.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.85.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.85.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.86.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.86.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.86.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.86.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.86.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.87.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.87.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.87.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.87.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.87.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.88.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.88.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.88.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.88.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.88.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.89.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.89.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.89.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.89.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.89.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.90.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.90.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.90.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.90.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.90.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.91.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.91.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.91.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.91.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.91.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.92.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.92.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.92.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.92.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.92.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.93.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.93.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.93.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.93.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.93.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.94.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.94.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.94.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.94.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.94.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.95.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.95.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.95.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.95.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.95.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.96.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.96.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.96.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.96.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.96.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.97.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.97.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.97.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.97.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.97.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.98.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.98.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.98.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.98.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.98.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.99.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.99.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.99.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.99.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.99.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.100.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.100.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.100.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.100.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.100.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.101.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.101.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.101.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.101.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.101.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.102.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.102.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.102.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.102.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.102.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.103.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.103.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.103.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.103.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.103.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.104.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.104.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.104.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.104.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.104.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.105.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.105.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.105.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.105.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.105.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.106.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.106.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.106.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.106.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.106.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.107.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.107.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.107.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.107.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.107.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.108.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.108.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.108.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.108.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.108.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.109.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.109.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.109.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.109.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.109.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.110.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.110.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.110.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.110.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.110.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.111.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.111.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.111.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.111.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.111.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.112.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.112.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.112.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.112.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.112.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.113.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.113.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.113.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.113.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.113.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.114.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.114.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.114.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.114.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.114.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.115.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.115.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.115.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.115.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.115.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.116.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.116.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.116.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.116.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.116.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.117.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.117.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.117.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.117.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.117.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.118.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.118.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.118.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.118.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.118.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.119.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.119.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.119.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.119.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.119.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.120.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.120.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.120.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.120.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.120.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.121.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.121.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.121.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.121.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.121.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.122.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.122.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.122.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.122.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.122.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.123.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.123.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.123.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.123.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.123.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.124.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.124.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.124.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.124.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.124.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.125.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.125.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.125.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.125.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.125.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.126.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.126.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.126.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.126.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.126.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.127.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.127.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.127.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.127.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.127.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.128.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.128.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.128.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.128.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.128.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.128.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.129.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.129.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.129.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.129.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.129.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.129.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.130.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.130.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.130.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.130.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.130.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.130.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.131.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.131.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.131.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.131.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.131.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.131.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.132.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.132.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.132.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.132.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.132.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.132.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.133.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.133.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.133.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.133.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.133.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.133.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.134.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.134.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.134.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.134.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.134.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.134.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.135.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.135.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.135.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.135.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.135.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.135.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.136.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.136.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.136.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.136.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.136.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.136.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.137.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.137.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.137.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.137.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.137.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.137.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.138.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.138.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.138.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.138.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.138.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.138.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.139.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.139.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.139.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.139.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.139.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.139.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.140.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.140.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.140.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.140.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.140.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.140.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.141.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.141.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.141.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.141.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.141.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.141.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.142.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.142.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.142.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.142.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.142.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.142.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.143.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.143.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.143.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.143.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.143.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.143.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.144.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.144.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.144.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.144.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.144.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.144.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.145.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.145.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.145.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.145.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.145.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.145.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.146.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.146.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.146.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.146.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.146.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.146.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.147.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.147.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.147.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.147.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.147.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.147.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.148.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.148.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.148.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.148.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.148.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.148.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.149.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.149.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.149.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.149.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.149.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.149.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.150.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.150.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.150.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.150.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.150.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.150.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.151.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.151.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.151.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.151.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.151.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.151.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.152.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.152.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.152.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.152.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.152.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.152.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.153.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.153.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.153.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.153.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.153.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.153.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.154.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.154.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.154.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.154.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.154.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.154.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.155.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.155.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.155.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.155.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.155.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.155.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.156.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.156.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.156.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.156.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.156.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.156.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.157.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.157.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.157.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.157.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.157.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.157.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.158.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.158.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.158.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.158.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.158.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.158.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.159.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.159.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.159.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.159.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.159.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.159.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.160.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.160.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.160.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.160.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.160.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.160.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.161.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.161.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.161.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.161.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.161.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.161.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.162.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.162.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.162.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.162.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.162.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.162.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.163.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.163.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.163.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.163.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.163.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.163.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.164.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.164.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.164.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.164.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.164.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.164.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.165.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.165.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.165.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.165.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.165.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.165.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.166.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.166.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.166.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.166.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.166.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.166.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.167.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.167.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.167.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.167.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.167.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.167.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.168.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.168.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.168.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.168.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.168.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.168.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.169.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.169.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.169.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.169.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.169.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.169.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.170.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.170.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.170.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.170.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.170.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.170.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.171.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.171.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.171.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.171.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.171.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.171.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.172.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.172.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.172.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.172.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.172.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.172.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.173.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.173.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.173.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.173.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.173.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.173.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.174.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.174.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.174.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.174.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.174.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.174.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.175.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.175.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.175.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.175.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.175.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.175.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.176.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.176.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.176.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.176.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.176.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.176.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.177.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.177.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.177.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.177.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.177.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.177.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.178.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.178.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.178.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.178.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.178.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.178.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.179.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.179.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.179.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.179.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.179.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.179.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.180.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.180.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.180.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.180.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.180.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.180.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.181.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.181.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.181.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.181.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.181.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.181.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.182.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.182.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.182.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.182.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.182.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.182.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.183.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.183.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.183.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.183.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.183.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.183.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.184.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.184.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.184.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.184.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.184.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.184.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.185.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.185.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.185.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.185.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.185.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.185.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.186.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.186.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.186.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.186.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.186.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.186.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.187.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.187.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.187.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.187.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.187.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.187.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.188.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.188.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.188.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.188.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.188.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.188.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.189.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.189.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.189.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.189.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.189.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.189.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.190.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.190.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.190.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.190.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.190.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.190.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.191.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.191.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.191.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.191.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.191.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.191.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.192.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.192.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.192.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.192.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.192.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.192.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.193.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.193.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.193.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.193.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.193.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.193.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.194.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.194.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.194.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.194.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.194.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.194.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.195.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.195.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.195.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.195.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.195.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.195.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.196.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.196.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.196.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.196.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.196.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.196.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.197.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.197.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.197.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.197.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.197.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.197.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.198.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.198.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.198.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.198.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.198.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.198.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.199.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.199.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.199.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.199.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.199.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.199.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.200.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.200.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.200.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.200.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.200.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.200.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.201.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.201.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.201.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.201.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.201.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.201.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.202.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.202.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.202.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.202.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.202.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.202.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.203.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.203.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.203.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.203.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.203.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.203.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.204.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.204.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.204.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.204.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.204.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.204.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.205.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.205.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.205.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.205.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.205.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.205.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.206.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.206.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.206.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.206.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.206.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.206.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.207.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.207.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.207.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.207.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.207.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.207.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.208.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.208.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.208.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.208.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.208.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.208.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.209.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.209.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.209.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.209.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.209.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.209.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.210.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.210.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.210.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.210.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.210.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.210.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.211.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.211.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.211.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.211.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.211.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.211.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.212.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.212.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.212.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.212.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.212.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.212.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.213.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.213.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.213.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.213.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.213.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.213.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.214.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.214.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.214.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.214.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.214.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.214.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.215.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.215.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.215.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.215.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.215.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.215.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.216.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.216.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.216.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.216.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.216.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.216.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.217.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.217.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.217.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.217.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.217.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.217.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.218.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.218.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.218.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.218.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.218.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.218.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.219.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.219.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.219.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.219.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.219.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.219.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.220.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.220.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.220.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.220.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.220.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.220.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.221.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.221.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.221.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.221.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.221.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.221.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.222.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.222.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.222.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.222.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.222.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.222.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.223.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.223.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.223.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.223.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.223.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.223.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.224.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.224.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.224.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.224.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.224.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.224.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.225.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.225.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.225.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.225.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.225.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.225.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.226.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.226.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.226.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.226.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.226.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.226.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.227.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.227.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.227.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.227.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.227.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.227.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.228.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.228.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.228.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.228.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.228.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.228.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.229.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.229.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.229.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.229.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.229.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.229.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.230.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.230.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.230.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.230.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.230.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.230.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.231.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.231.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.231.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.231.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.231.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.231.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.232.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.232.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.232.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.232.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.232.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.232.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.233.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.233.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.233.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.233.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.233.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.233.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.234.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.234.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.234.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.234.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.234.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.234.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.235.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.235.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.235.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.235.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.235.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.235.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.236.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.236.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.236.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.236.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.236.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.236.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.237.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.237.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.237.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.237.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.237.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.237.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.238.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.238.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.238.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.238.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.238.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.238.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.239.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.239.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.239.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.239.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.239.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.239.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.240.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.240.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.240.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.240.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.240.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.240.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.241.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.241.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.241.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.241.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.241.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.241.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.242.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.242.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.242.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.242.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.242.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.242.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.243.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.243.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.243.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.243.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.243.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.243.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.244.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.244.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.244.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.244.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.244.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.244.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.245.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.245.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.245.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.245.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.245.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.245.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.246.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.246.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.246.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.246.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.246.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.246.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.247.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.247.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.247.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.247.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.247.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.247.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.248.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.248.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.248.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.248.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.248.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.248.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.249.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.249.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.249.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.249.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.249.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.249.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.250.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.250.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.250.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.250.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.250.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.250.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.251.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.251.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.251.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.251.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.251.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.251.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.252.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.252.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.252.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.252.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.252.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.252.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.253.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.253.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.253.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.253.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.253.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.253.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.254.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.254.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.254.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.254.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.254.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.254.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.255.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.255.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.255.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.255.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.255.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.255.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.input_layernorm.weight": "model-00037-of-000163.safetensors", "model.layers.15.post_attention_layernorm.weight": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.q_a_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.self_attn.q_a_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.q_a_layernorm.weight": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.q_b_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.self_attn.q_b_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.kv_a_proj_with_mqa.weight": "model-00037-of-000163.safetensors", - "model.layers.16.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.kv_a_layernorm.weight": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.kv_b_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.self_attn.kv_b_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.o_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.self_attn.o_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.gate.weight": "model-00037-of-000163.safetensors", "model.layers.16.mlp.gate.e_score_correction_bias": "model-00037-of-000163.safetensors", "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.shared_experts.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.shared_experts.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.0.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.0.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.0.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.0.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.0.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.1.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.1.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.1.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.1.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.1.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.2.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.2.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.2.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.2.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.2.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.3.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.3.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.3.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.3.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.3.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.4.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.4.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.4.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.4.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.4.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.5.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.5.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.5.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.5.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.5.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.6.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.6.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.6.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.6.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.6.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.7.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.7.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.7.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.7.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.7.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.8.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.8.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.8.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.8.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.8.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.9.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.9.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.9.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.9.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.9.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.10.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.10.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.10.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.10.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.10.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.11.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.11.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.11.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.11.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.11.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.12.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.12.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.12.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.12.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.12.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.13.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.13.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.13.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.13.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.13.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.14.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.14.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.14.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.14.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.14.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.15.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.15.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.15.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.15.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.15.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.16.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.16.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.16.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.16.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.16.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.16.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.17.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.17.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.17.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.17.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.17.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.18.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.18.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.18.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.18.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.18.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.19.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.19.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.19.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.19.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.19.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.20.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.20.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.20.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.20.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.20.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.21.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.21.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.21.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.21.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.21.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.22.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.22.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.22.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.22.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.22.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.23.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.23.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.23.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.23.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.23.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.24.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.24.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.24.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.24.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.24.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.25.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.25.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.25.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.25.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.25.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.26.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.26.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.26.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.26.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.26.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.27.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.27.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.27.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.27.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.27.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.28.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.28.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.28.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.28.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.28.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.29.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.29.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.29.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.29.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.29.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.30.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.30.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.30.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.30.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.30.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.31.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.31.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.31.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.31.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.31.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.32.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.32.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.32.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.32.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.32.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.33.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.33.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.33.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.33.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.33.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.34.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.34.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.34.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.34.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.34.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.35.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.35.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.35.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.35.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.35.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.36.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.36.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.36.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.36.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.36.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.37.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.37.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.37.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.37.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.37.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.38.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.38.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.38.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.38.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.38.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.39.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.39.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.39.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.39.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.39.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.40.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.40.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.40.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.40.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.40.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.41.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.41.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.41.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.41.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.41.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.42.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.42.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.42.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.42.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.42.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.43.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.43.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.43.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.43.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.43.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.44.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.44.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.44.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.44.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.44.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.45.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.45.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.45.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.45.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.45.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.46.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.46.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.46.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.46.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.46.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.47.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.47.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.47.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.47.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.47.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.48.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.48.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.48.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.48.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.48.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.49.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.49.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.49.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.49.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.49.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.50.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.50.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.50.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.50.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.50.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.51.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.51.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.51.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.51.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.51.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.52.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.52.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.52.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.52.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.52.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.53.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.53.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.53.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.53.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.53.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.54.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.54.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.54.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.54.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.54.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.55.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.55.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.55.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.55.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.55.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.56.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.56.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.56.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.56.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.56.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.57.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.57.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.57.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.57.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.57.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.58.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.58.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.58.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.58.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.58.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.59.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.59.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.59.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.59.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.59.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.60.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.60.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.60.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.60.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.60.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.61.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.61.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.61.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.61.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.61.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.62.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.62.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.62.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.62.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.62.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.63.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.63.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.63.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.63.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.63.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.64.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.64.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.64.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.64.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.64.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.65.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.65.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.65.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.65.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.65.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.65.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.66.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.66.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.66.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.66.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.66.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.67.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.67.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.67.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.67.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.67.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.68.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.68.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.68.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.68.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.68.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.69.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.69.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.69.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.69.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.69.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.70.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.70.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.70.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.70.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.70.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.71.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.71.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.71.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.71.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.71.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.72.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.72.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.72.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.72.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.72.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.73.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.73.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.73.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.73.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.73.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.74.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.74.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.74.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.74.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.74.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.75.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.75.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.75.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.75.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.75.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.76.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.76.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.76.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.76.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.76.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.77.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.77.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.77.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.77.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.77.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.78.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.78.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.78.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.78.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.78.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.79.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.79.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.79.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.79.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.79.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.80.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.80.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.80.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.80.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.80.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.81.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.81.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.81.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.81.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.81.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.82.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.82.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.82.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.82.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.82.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.83.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.83.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.83.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.83.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.83.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.84.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.84.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.84.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.84.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.84.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.85.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.85.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.85.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.85.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.85.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.86.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.86.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.86.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.86.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.86.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.87.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.87.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.87.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.87.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.87.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.88.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.88.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.88.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.88.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.88.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.89.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.89.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.89.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.89.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.89.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.90.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.90.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.90.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.90.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.90.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.91.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.91.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.91.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.91.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.91.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.92.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.92.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.92.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.92.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.92.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.93.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.93.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.93.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.93.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.93.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.94.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.94.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.94.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.94.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.94.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.95.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.95.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.95.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.95.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.95.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.96.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.96.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.96.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.96.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.96.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.97.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.97.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.97.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.97.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.97.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.98.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.98.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.98.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.98.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.98.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.99.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.99.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.99.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.99.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.99.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.100.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.100.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.100.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.100.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.100.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.101.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.101.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.101.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.101.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.101.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.102.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.102.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.102.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.102.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.102.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.103.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.103.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.103.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.103.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.103.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.104.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.104.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.104.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.104.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.104.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.105.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.105.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.105.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.105.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.105.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.106.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.106.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.106.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.106.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.106.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.107.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.107.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.107.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.107.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.107.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.108.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.108.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.108.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.108.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.108.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.109.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.109.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.109.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.109.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.109.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.110.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.110.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.110.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.110.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.110.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.111.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.111.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.111.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.111.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.111.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.112.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.112.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.112.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.112.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.112.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.113.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.113.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.113.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.113.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.113.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.114.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.114.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.114.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.114.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.114.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.115.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.115.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.115.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.115.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.115.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.116.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.116.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.116.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.116.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.116.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.117.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.117.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.117.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.117.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.117.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.118.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.118.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.118.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.118.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.118.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.119.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.119.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.119.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.119.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.119.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.120.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.120.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.120.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.120.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.120.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.121.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.121.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.121.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.121.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.121.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.122.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.122.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.122.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.122.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.122.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.123.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.123.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.123.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.123.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.123.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.124.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.124.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.124.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.124.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.124.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.125.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.125.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.125.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.125.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.125.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.126.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.126.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.126.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.126.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.126.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.127.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.127.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.127.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.127.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.127.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.128.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.128.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.128.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.128.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.128.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.128.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.129.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.129.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.129.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.129.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.129.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.129.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.130.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.130.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.130.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.130.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.130.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.130.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.131.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.131.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.131.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.131.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.131.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.131.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.132.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.132.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.132.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.132.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.132.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.132.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.133.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.133.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.133.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.133.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.133.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.133.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.134.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.134.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.134.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.134.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.134.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.134.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.135.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.135.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.135.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.135.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.135.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.135.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.136.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.136.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.136.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.136.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.136.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.136.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.137.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.137.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.137.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.137.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.137.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.137.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.138.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.138.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.138.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.138.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.138.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.138.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.139.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.139.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.139.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.139.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.139.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.139.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.140.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.140.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.140.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.140.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.140.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.140.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.141.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.141.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.141.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.141.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.141.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.141.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.142.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.142.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.142.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.142.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.142.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.142.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.143.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.143.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.143.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.143.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.143.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.143.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.144.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.144.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.144.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.144.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.144.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.144.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.145.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.145.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.145.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.145.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.145.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.145.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.146.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.146.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.146.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.146.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.146.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.146.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.147.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.147.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.147.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.147.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.147.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.147.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.148.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.148.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.148.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.148.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.148.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.148.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.149.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.149.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.149.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.149.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.149.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.149.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.150.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.150.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.150.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.150.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.150.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.150.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.151.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.151.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.151.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.151.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.151.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.151.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.152.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.152.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.152.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.152.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.152.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.152.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.153.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.153.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.153.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.153.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.153.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.153.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.154.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.154.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.154.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.154.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.154.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.154.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.155.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.155.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.155.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.155.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.155.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.155.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.156.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.156.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.156.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.156.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.156.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.156.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.157.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.157.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.157.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.157.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.157.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.157.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.158.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.158.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.158.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.158.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.158.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.158.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.159.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.159.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.159.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.159.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.159.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.159.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.160.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.160.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.160.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.160.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.160.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.160.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.161.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.161.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.161.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.161.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.161.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.161.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.162.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.162.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.162.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.162.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.162.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.162.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.163.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.163.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.163.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.163.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.163.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.163.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.164.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.164.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.164.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.164.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.164.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.164.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.165.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.165.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.165.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.165.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.165.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.165.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.166.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.166.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.166.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.166.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.166.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.166.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.167.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.167.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.167.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.167.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.167.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.167.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.168.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.168.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.168.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.168.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.168.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.168.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.169.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.169.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.169.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.169.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.169.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.169.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.170.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.170.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.170.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.170.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.170.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.170.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.171.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.171.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.171.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.171.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.171.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.171.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.172.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.172.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.172.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.172.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.172.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.172.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.173.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.173.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.173.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.173.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.173.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.173.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.174.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.174.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.174.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.174.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.174.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.174.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.175.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.175.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.175.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.175.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.175.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.175.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.176.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.176.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.176.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.176.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.176.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.176.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.177.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.177.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.177.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.177.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.177.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.177.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.178.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.178.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.178.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.178.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.178.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.178.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.179.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.179.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.179.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.179.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.179.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.179.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.180.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.180.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.180.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.180.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.180.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.180.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.181.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.181.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.181.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.181.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.181.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.181.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.182.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.182.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.182.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.182.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.182.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.182.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.183.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.183.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.183.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.183.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.183.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.183.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.184.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.184.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.184.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.184.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.184.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.184.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.185.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.185.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.185.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.185.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.185.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.185.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.186.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.186.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.186.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.186.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.186.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.186.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.187.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.187.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.187.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.187.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.187.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.187.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.188.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.188.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.188.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.188.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.188.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.188.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.189.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.189.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.189.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.189.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.189.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.189.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.190.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.190.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.190.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.190.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.190.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.190.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.191.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.191.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.191.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.191.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.191.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.191.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.192.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.192.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.192.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.192.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.192.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.192.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.193.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.193.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.193.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.193.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.193.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.193.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.194.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.194.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.194.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.194.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.194.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.194.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.195.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.195.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.195.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.195.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.195.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.195.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.196.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.196.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.196.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.196.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.196.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.196.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.197.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.197.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.197.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.197.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.197.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.197.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.198.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.198.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.198.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.198.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.198.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.198.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.199.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.199.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.199.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.199.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.199.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.199.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.200.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.200.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.200.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.200.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.200.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.200.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.201.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.201.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.201.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.201.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.201.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.201.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.202.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.202.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.202.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.202.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.202.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.202.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.203.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.203.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.203.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.203.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.203.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.203.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.204.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.204.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.204.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.204.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.204.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.204.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.205.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.205.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.205.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.205.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.205.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.205.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.206.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.206.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.206.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.206.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.206.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.206.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.207.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.207.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.207.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.207.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.207.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.207.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.208.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.208.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.208.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.208.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.208.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.208.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.209.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.209.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.209.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.209.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.209.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.209.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.210.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.210.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.210.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.210.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.210.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.210.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.211.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.211.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.211.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.211.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.211.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.211.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.212.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.212.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.212.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.212.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.212.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.212.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.213.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.213.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.213.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.213.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.213.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.213.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.214.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.214.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.214.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.214.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.214.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.214.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.215.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.215.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.215.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.215.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.215.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.215.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.216.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.216.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.216.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.216.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.216.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.216.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.217.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.217.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.217.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.217.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.217.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.217.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.218.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.218.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.218.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.218.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.218.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.218.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.219.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.219.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.219.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.219.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.219.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.219.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.220.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.220.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.220.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.220.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.220.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.220.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.221.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.221.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.221.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.221.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.221.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.221.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.222.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.222.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.222.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.222.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.222.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.222.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.223.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.223.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.223.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.223.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.223.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.223.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.224.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.224.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.224.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.224.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.224.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.224.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.225.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.225.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.225.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.225.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.225.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.225.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.226.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.226.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.226.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.226.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.226.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.226.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.227.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.227.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.227.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.227.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.227.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.227.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.228.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.228.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.228.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.228.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.228.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.228.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.229.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.229.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.229.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.229.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.229.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.229.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.230.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.230.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.230.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.230.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.230.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.230.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.231.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.231.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.231.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.231.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.231.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.231.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.232.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.232.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.232.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.232.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.232.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.232.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.233.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.233.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.233.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.233.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.233.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.233.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.234.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.234.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.234.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.234.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.234.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.234.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.235.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.235.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.235.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.235.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.235.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.235.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.236.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.236.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.236.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.236.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.236.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.236.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.237.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.237.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.237.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.237.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.237.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.237.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.238.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.238.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.238.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.238.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.238.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.238.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.239.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.239.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.239.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.239.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.239.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.239.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.240.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.240.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.240.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.240.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.240.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.240.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.241.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.241.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.241.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.241.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.241.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.241.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.242.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.242.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.242.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.242.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.242.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.242.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.243.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.243.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.243.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.243.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.243.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.243.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.244.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.244.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.244.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.244.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.244.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.244.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.245.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.245.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.245.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.245.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.245.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.245.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.246.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.246.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.246.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.246.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.246.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.246.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.247.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.247.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.247.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.247.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.247.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.247.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.248.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.248.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.248.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.248.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.248.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.248.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.249.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.249.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.249.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.249.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.249.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.249.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.250.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.250.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.250.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.250.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.250.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.250.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.251.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.251.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.251.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.251.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.251.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.251.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.252.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.252.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.252.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.252.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.252.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.252.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.253.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.253.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.253.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.253.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.253.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.253.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.254.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.254.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.254.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.254.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.254.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.254.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.255.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.255.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.255.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.255.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.255.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.255.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.input_layernorm.weight": "model-00040-of-000163.safetensors", "model.layers.16.post_attention_layernorm.weight": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.q_a_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.self_attn.q_a_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.q_a_layernorm.weight": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.q_b_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.self_attn.q_b_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.kv_a_proj_with_mqa.weight": "model-00040-of-000163.safetensors", - "model.layers.17.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.kv_a_layernorm.weight": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.kv_b_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.self_attn.kv_b_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.o_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.self_attn.o_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.gate.weight": "model-00040-of-000163.safetensors", "model.layers.17.mlp.gate.e_score_correction_bias": "model-00040-of-000163.safetensors", "model.layers.17.mlp.shared_experts.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.shared_experts.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.shared_experts.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.shared_experts.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.0.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.0.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.0.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.0.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.0.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.1.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.1.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.1.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.1.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.1.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.2.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.2.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.2.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.2.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.2.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.3.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.3.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.3.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.3.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.3.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.4.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.4.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.4.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.4.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.4.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.5.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.5.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.5.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.5.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.5.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.6.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.6.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.6.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.6.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.6.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.7.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.7.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.7.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.7.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.7.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.8.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.8.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.8.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.8.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.8.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.9.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.9.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.9.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.9.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.9.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.10.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.10.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.10.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.10.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.10.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.11.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.11.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.11.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.11.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.11.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.12.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.12.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.12.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.12.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.12.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.13.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.13.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.13.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.13.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.13.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.14.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.14.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.14.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.14.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.14.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.15.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.15.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.15.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.15.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.15.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.15.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.16.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.16.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.16.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.16.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.16.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.17.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.17.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.17.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.17.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.17.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.18.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.18.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.18.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.18.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.18.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.19.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.19.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.19.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.19.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.19.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.20.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.20.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.20.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.20.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.20.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.21.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.21.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.21.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.21.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.21.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.22.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.22.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.22.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.22.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.22.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.23.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.23.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.23.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.23.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.23.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.24.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.24.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.24.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.24.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.24.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.25.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.25.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.25.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.25.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.25.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.26.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.26.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.26.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.26.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.26.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.27.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.27.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.27.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.27.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.27.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.28.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.28.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.28.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.28.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.28.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.29.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.29.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.29.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.29.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.29.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.30.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.30.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.30.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.30.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.30.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.30.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.31.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.31.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.31.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.31.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.31.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.32.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.32.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.32.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.32.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.32.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.33.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.33.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.33.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.33.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.33.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.34.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.34.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.34.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.34.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.34.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.35.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.35.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.35.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.35.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.35.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.36.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.36.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.36.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.36.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.36.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.37.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.37.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.37.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.37.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.37.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.38.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.38.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.38.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.38.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.38.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.39.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.39.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.39.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.39.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.39.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.40.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.40.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.40.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.40.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.40.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.41.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.41.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.41.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.41.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.41.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.42.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.42.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.42.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.42.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.42.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.43.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.43.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.43.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.43.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.43.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.44.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.44.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.44.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.44.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.44.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.45.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.45.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.45.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.45.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.45.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.46.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.46.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.46.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.46.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.46.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.47.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.47.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.47.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.47.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.47.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.48.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.48.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.48.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.48.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.48.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.49.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.49.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.49.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.49.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.49.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.50.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.50.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.50.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.50.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.50.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.51.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.51.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.51.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.51.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.51.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.52.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.52.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.52.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.52.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.52.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.53.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.53.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.53.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.53.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.53.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.54.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.54.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.54.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.54.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.54.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.55.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.55.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.55.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.55.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.55.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.56.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.56.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.56.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.56.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.56.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.57.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.57.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.57.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.57.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.57.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.58.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.58.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.58.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.58.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.58.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.59.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.59.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.59.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.59.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.59.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.60.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.60.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.60.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.60.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.60.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.61.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.61.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.61.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.61.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.61.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.62.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.62.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.62.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.62.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.62.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.63.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.63.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.63.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.63.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.63.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.64.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.64.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.64.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.64.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.64.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.65.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.65.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.65.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.65.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.65.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.66.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.66.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.66.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.66.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.66.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.67.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.67.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.67.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.67.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.67.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.68.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.68.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.68.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.68.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.68.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.69.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.69.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.69.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.69.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.69.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.70.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.70.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.70.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.70.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.70.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.71.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.71.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.71.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.71.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.71.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.72.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.72.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.72.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.72.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.72.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.73.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.73.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.73.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.73.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.73.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.74.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.74.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.74.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.74.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.74.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.75.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.75.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.75.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.75.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.75.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.76.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.76.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.76.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.76.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.76.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.77.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.77.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.77.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.77.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.77.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.78.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.78.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.78.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.78.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.78.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.79.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.79.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.79.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.79.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.79.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.80.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.80.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.80.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.80.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.80.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.81.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.81.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.81.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.81.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.81.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.82.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.82.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.82.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.82.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.82.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.83.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.83.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.83.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.83.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.83.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.84.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.84.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.84.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.84.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.84.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.85.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.85.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.85.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.85.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.85.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.86.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.86.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.86.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.86.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.86.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.86.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.87.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.87.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.87.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.87.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.87.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.88.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.88.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.88.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.88.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.88.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.89.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.89.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.89.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.89.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.89.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.90.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.90.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.90.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.90.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.90.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.91.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.91.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.91.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.91.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.91.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.92.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.92.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.92.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.92.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.92.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.93.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.93.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.93.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.93.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.93.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.94.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.94.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.94.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.94.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.94.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.94.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.95.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.95.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.95.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.95.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.95.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.96.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.96.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.96.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.96.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.96.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.97.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.97.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.97.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.97.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.97.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.98.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.98.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.98.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.98.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.98.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.99.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.99.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.99.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.99.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.99.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.100.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.100.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.100.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.100.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.100.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.101.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.101.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.101.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.101.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.101.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.102.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.102.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.102.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.102.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.102.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.103.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.103.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.103.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.103.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.103.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.104.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.104.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.104.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.104.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.104.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.105.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.105.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.105.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.105.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.105.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.106.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.106.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.106.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.106.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.106.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.107.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.107.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.107.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.107.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.107.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.108.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.108.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.108.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.108.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.108.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.109.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.109.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.109.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.109.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.109.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.110.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.110.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.110.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.110.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.110.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.111.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.111.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.111.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.111.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.111.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.112.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.112.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.112.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.112.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.112.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.113.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.113.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.113.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.113.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.113.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.114.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.114.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.114.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.114.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.114.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.115.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.115.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.115.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.115.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.115.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.116.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.116.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.116.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.116.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.116.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.117.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.117.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.117.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.117.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.117.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.118.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.118.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.118.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.118.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.118.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.119.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.119.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.119.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.119.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.119.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.120.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.120.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.120.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.120.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.120.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.121.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.121.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.121.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.121.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.121.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.122.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.122.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.122.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.122.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.122.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.123.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.123.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.123.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.123.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.123.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.124.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.124.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.124.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.124.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.124.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.125.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.125.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.125.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.125.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.125.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.126.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.126.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.126.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.126.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.126.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.127.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.127.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.127.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.127.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.127.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.128.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.128.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.128.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.128.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.128.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.128.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.129.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.129.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.129.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.129.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.129.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.129.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.130.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.130.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.130.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.130.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.130.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.130.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.131.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.131.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.131.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.131.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.131.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.131.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.132.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.132.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.132.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.132.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.132.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.132.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.133.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.133.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.133.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.133.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.133.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.133.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.134.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.134.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.134.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.134.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.134.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.134.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.135.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.135.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.135.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.135.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.135.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.135.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.136.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.136.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.136.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.136.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.136.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.136.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.137.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.137.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.137.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.137.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.137.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.137.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.138.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.138.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.138.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.138.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.138.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.138.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.139.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.139.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.139.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.139.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.139.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.139.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.140.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.140.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.140.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.140.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.140.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.140.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.141.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.141.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.141.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.141.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.141.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.141.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.142.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.142.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.142.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.142.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.142.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.142.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.143.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.143.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.143.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.143.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.143.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.143.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.144.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.144.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.144.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.144.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.144.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.144.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.145.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.145.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.145.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.145.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.145.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.145.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.146.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.146.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.146.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.146.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.146.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.146.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.147.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.147.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.147.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.147.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.147.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.147.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.148.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.148.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.148.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.148.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.148.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.148.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.149.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.149.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.149.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.149.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.149.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.149.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.150.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.150.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.150.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.150.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.150.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.150.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.151.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.151.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.151.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.151.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.151.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.151.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.152.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.152.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.152.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.152.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.152.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.152.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.153.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.153.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.153.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.153.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.153.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.153.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.154.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.154.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.154.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.154.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.154.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.154.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.155.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.155.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.155.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.155.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.155.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.155.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.156.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.156.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.156.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.156.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.156.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.156.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.157.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.157.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.157.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.157.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.157.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.157.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.158.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.158.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.158.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.158.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.158.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.158.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.159.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.159.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.159.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.159.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.159.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.159.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.160.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.160.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.160.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.160.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.160.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.160.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.161.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.161.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.161.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.161.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.161.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.161.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.162.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.162.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.162.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.162.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.162.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.162.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.163.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.163.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.163.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.163.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.163.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.163.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.164.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.164.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.164.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.164.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.164.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.164.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.165.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.165.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.165.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.165.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.165.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.165.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.166.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.166.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.166.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.166.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.166.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.166.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.167.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.167.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.167.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.167.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.167.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.167.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.168.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.168.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.168.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.168.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.168.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.168.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.169.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.169.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.169.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.169.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.169.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.169.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.170.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.170.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.170.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.170.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.170.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.170.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.171.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.171.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.171.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.171.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.171.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.171.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.172.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.172.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.172.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.172.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.172.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.172.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.173.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.173.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.173.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.173.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.173.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.173.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.174.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.174.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.174.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.174.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.174.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.174.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.175.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.175.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.175.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.175.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.175.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.175.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.176.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.176.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.176.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.176.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.176.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.176.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.177.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.177.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.177.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.177.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.177.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.177.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.178.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.178.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.178.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.178.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.178.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.178.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.179.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.179.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.179.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.179.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.179.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.179.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.180.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.180.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.180.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.180.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.180.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.180.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.181.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.181.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.181.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.181.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.181.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.181.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.182.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.182.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.182.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.182.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.182.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.182.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.183.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.183.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.183.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.183.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.183.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.183.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.184.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.184.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.184.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.184.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.184.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.184.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.185.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.185.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.185.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.185.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.185.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.185.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.186.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.186.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.186.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.186.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.186.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.186.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.187.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.187.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.187.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.187.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.187.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.187.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.188.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.188.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.188.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.188.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.188.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.188.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.189.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.189.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.189.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.189.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.189.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.189.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.190.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.190.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.190.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.190.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.190.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.190.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.191.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.191.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.191.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.191.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.191.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.191.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.192.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.192.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.192.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.192.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.192.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.192.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.193.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.193.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.193.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.193.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.193.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.193.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.194.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.194.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.194.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.194.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.194.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.194.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.195.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.195.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.195.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.195.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.195.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.195.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.196.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.196.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.196.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.196.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.196.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.196.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.197.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.197.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.197.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.197.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.197.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.197.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.198.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.198.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.198.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.198.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.198.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.198.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.199.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.199.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.199.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.199.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.199.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.199.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.200.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.200.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.200.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.200.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.200.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.200.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.201.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.201.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.201.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.201.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.201.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.201.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.202.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.202.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.202.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.202.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.202.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.202.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.203.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.203.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.203.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.203.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.203.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.203.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.204.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.204.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.204.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.204.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.204.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.204.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.205.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.205.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.205.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.205.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.205.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.205.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.206.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.206.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.206.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.206.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.206.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.206.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.207.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.207.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.207.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.207.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.207.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.207.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.208.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.208.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.208.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.208.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.208.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.208.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.209.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.209.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.209.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.209.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.209.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.209.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.210.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.210.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.210.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.210.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.210.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.210.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.211.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.211.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.211.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.211.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.211.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.211.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.212.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.212.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.212.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.212.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.212.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.212.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.213.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.213.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.213.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.213.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.213.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.213.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.214.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.214.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.214.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.214.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.214.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.214.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.215.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.215.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.215.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.215.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.215.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.215.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.216.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.216.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.216.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.216.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.216.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.216.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.217.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.217.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.217.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.217.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.217.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.217.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.218.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.218.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.218.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.218.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.218.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.218.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.219.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.219.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.219.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.219.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.219.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.219.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.220.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.220.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.220.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.220.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.220.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.220.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.221.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.221.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.221.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.221.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.221.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.221.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.222.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.222.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.222.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.222.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.222.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.222.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.223.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.223.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.223.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.223.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.223.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.223.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.224.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.224.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.224.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.224.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.224.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.224.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.225.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.225.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.225.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.225.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.225.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.225.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.226.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.226.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.226.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.226.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.226.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.226.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.227.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.227.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.227.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.227.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.227.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.227.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.228.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.228.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.228.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.228.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.228.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.228.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.229.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.229.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.229.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.229.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.229.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.229.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.230.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.230.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.230.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.230.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.230.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.230.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.231.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.231.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.231.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.231.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.231.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.231.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.232.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.232.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.232.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.232.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.232.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.232.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.233.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.233.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.233.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.233.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.233.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.233.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.234.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.234.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.234.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.234.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.234.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.234.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.235.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.235.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.235.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.235.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.235.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.235.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.236.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.236.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.236.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.236.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.236.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.236.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.237.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.237.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.237.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.237.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.237.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.237.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.238.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.238.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.238.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.238.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.238.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.238.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.239.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.239.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.239.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.239.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.239.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.239.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.240.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.240.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.240.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.240.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.240.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.240.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.241.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.241.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.241.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.241.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.241.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.241.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.242.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.242.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.242.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.242.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.242.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.242.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.243.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.243.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.243.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.243.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.243.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.243.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.244.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.244.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.244.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.244.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.244.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.244.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.245.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.245.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.245.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.245.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.245.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.245.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.246.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.246.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.246.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.246.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.246.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.246.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.247.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.247.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.247.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.247.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.247.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.247.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.248.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.248.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.248.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.248.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.248.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.248.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.249.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.249.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.249.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.249.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.249.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.249.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.250.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.250.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.250.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.250.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.250.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.250.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.251.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.251.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.251.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.251.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.251.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.251.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.252.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.252.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.252.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.252.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.252.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.252.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.253.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.253.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.253.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.253.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.253.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.253.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.254.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.254.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.254.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.254.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.254.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.254.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.255.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.255.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.255.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.255.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.255.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.255.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.input_layernorm.weight": "model-00043-of-000163.safetensors", "model.layers.17.post_attention_layernorm.weight": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.q_a_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.self_attn.q_a_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.q_a_layernorm.weight": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.q_b_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.self_attn.q_b_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.kv_a_proj_with_mqa.weight": "model-00043-of-000163.safetensors", - "model.layers.18.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.kv_a_layernorm.weight": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.kv_b_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.self_attn.kv_b_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.o_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.self_attn.o_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.gate.weight": "model-00043-of-000163.safetensors", "model.layers.18.mlp.gate.e_score_correction_bias": "model-00043-of-000163.safetensors", "model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.shared_experts.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.shared_experts.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.0.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.0.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.0.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.0.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.0.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.1.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.1.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.1.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.1.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.1.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.2.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.2.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.2.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.2.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.2.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.3.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.3.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.3.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.3.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.3.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.4.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.4.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.4.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.4.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.4.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.5.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.5.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.5.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.5.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.5.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.6.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.6.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.6.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.6.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.6.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.7.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.7.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.7.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.7.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.7.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.8.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.8.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.8.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.8.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.8.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.9.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.9.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.9.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.9.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.9.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.10.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.10.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.10.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.10.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.10.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.11.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.11.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.11.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.11.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.11.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.12.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.12.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.12.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.12.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.12.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.13.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.13.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.13.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.13.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.13.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.14.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.14.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.14.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.14.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.14.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.15.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.15.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.15.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.15.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.15.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.16.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.16.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.16.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.16.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.16.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.17.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.17.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.17.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.17.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.17.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.18.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.18.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.18.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.18.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.18.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.19.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.19.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.19.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.19.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.19.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.20.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.20.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.20.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.20.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.20.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.21.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.21.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.21.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.21.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.21.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.22.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.22.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.22.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.22.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.22.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.23.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.23.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.23.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.23.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.23.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.24.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.24.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.24.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.24.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.24.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.25.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.25.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.25.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.25.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.25.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.26.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.26.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.26.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.26.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.26.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.27.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.27.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.27.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.27.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.27.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.28.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.28.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.28.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.28.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.28.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.29.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.29.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.29.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.29.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.29.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.30.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.30.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.30.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.30.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.30.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.31.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.31.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.31.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.31.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.31.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.32.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.32.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.32.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.32.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.32.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.33.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.33.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.33.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.33.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.33.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.34.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.34.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.34.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.34.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.34.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.35.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.35.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.35.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.35.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.35.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.36.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.36.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.36.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.36.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.36.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.37.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.37.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.37.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.37.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.37.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.38.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.38.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.38.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.38.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.38.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.39.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.39.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.39.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.39.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.39.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.40.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.40.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.40.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.40.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.40.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.41.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.41.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.41.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.41.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.41.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.42.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.42.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.42.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.42.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.42.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.43.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.43.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.43.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.43.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.43.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.44.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.44.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.44.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.44.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.44.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.45.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.45.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.45.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.45.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.45.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.46.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.46.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.46.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.46.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.46.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.47.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.47.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.47.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.47.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.47.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.48.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.48.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.48.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.48.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.48.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.49.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.49.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.49.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.49.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.49.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.50.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.50.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.50.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.50.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.50.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.51.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.51.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.51.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.51.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.51.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.52.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.52.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.52.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.52.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.52.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.53.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.53.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.53.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.53.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.53.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.54.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.54.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.54.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.54.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.54.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.55.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.55.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.55.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.55.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.55.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.56.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.56.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.56.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.56.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.56.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.57.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.57.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.57.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.57.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.57.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.58.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.58.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.58.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.58.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.58.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.59.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.59.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.59.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.59.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.59.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.60.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.60.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.60.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.60.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.60.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.61.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.61.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.61.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.61.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.61.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.62.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.62.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.62.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.62.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.62.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.63.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.63.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.63.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.63.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.63.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.64.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.64.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.64.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.64.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.64.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.65.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.65.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.65.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.65.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.65.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.66.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.66.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.66.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.66.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.66.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.67.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.67.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.67.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.67.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.67.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.68.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.68.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.68.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.68.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.68.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.69.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.69.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.69.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.69.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.69.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.70.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.70.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.70.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.70.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.70.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.71.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.71.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.71.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.71.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.71.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.72.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.72.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.72.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.72.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.72.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.72.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.73.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.73.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.73.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.73.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.73.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.74.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.74.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.74.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.74.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.74.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.75.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.75.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.75.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.75.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.75.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.76.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.76.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.76.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.76.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.76.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.77.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.77.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.77.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.77.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.77.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.78.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.78.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.78.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.78.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.78.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.79.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.79.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.79.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.79.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.79.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.80.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.80.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.80.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.80.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.80.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.81.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.81.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.81.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.81.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.81.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.82.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.82.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.82.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.82.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.82.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.83.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.83.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.83.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.83.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.83.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.84.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.84.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.84.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.84.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.84.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.85.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.85.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.85.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.85.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.85.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.86.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.86.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.86.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.86.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.86.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.87.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.87.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.87.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.87.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.87.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.88.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.88.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.88.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.88.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.88.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.89.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.89.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.89.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.89.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.89.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.90.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.90.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.90.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.90.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.90.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.91.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.91.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.91.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.91.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.91.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.92.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.92.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.92.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.92.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.92.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.93.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.93.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.93.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.93.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.93.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.94.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.94.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.94.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.94.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.94.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.94.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.95.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.95.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.95.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.95.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.95.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.96.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.96.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.96.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.96.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.96.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.97.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.97.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.97.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.97.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.97.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.98.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.98.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.98.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.98.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.98.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.99.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.99.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.99.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.99.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.99.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.100.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.100.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.100.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.100.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.100.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.101.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.101.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.101.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.101.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.101.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.102.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.102.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.102.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.102.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.102.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.103.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.103.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.103.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.103.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.103.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.104.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.104.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.104.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.104.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.104.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.105.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.105.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.105.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.105.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.105.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.106.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.106.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.106.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.106.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.106.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.107.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.107.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.107.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.107.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.107.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.108.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.108.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.108.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.108.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.108.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.109.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.109.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.109.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.109.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.109.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.110.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.110.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.110.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.110.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.110.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.111.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.111.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.111.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.111.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.111.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.112.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.112.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.112.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.112.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.112.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.113.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.113.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.113.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.113.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.113.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.114.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.114.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.114.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.114.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.114.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.115.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.115.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.115.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.115.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.115.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.116.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.116.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.116.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.116.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.116.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.117.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.117.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.117.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.117.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.117.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.117.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.118.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.118.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.118.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.118.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.118.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.119.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.119.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.119.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.119.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.119.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.120.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.120.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.120.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.120.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.120.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.121.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.121.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.121.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.121.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.121.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.122.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.122.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.122.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.122.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.122.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.123.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.123.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.123.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.123.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.123.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.124.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.124.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.124.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.124.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.124.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.125.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.125.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.125.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.125.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.125.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.126.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.126.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.126.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.126.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.126.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.127.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.127.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.127.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.127.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.127.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.128.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.128.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.128.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.128.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.128.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.128.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.129.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.129.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.129.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.129.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.129.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.129.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.130.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.130.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.130.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.130.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.130.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.130.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.131.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.131.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.131.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.131.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.131.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.131.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.132.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.132.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.132.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.132.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.132.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.132.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.133.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.133.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.133.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.133.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.133.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.133.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.134.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.134.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.134.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.134.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.134.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.134.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.135.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.135.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.135.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.135.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.135.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.135.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.136.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.136.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.136.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.136.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.136.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.136.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.137.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.137.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.137.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.137.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.137.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.137.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.138.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.138.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.138.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.138.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.138.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.138.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.139.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.139.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.139.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.139.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.139.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.139.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.140.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.140.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.140.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.140.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.140.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.140.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.141.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.141.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.141.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.141.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.141.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.141.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.142.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.142.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.142.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.142.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.142.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.142.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.143.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.143.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.143.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.143.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.143.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.143.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.144.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.144.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.144.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.144.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.144.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.144.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.145.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.145.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.145.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.145.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.145.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.145.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.146.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.146.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.146.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.146.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.146.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.146.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.147.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.147.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.147.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.147.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.147.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.147.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.148.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.148.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.148.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.148.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.148.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.148.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.149.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.149.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.149.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.149.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.149.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.149.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.150.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.150.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.150.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.150.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.150.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.150.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.151.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.151.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.151.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.151.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.151.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.151.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.152.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.152.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.152.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.152.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.152.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.152.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.153.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.153.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.153.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.153.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.153.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.153.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.154.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.154.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.154.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.154.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.154.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.154.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.155.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.155.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.155.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.155.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.155.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.155.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.156.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.156.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.156.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.156.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.156.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.156.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.157.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.157.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.157.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.157.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.157.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.157.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.158.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.158.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.158.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.158.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.158.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.158.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.159.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.159.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.159.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.159.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.159.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.159.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.160.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.160.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.160.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.160.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.160.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.160.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.161.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.161.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.161.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.161.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.161.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.161.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.162.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.162.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.162.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.162.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.162.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.162.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.163.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.163.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.163.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.163.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.163.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.163.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.164.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.164.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.164.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.164.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.164.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.164.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.165.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.165.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.165.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.165.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.165.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.165.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.166.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.166.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.166.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.166.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.166.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.166.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.167.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.167.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.167.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.167.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.167.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.167.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.168.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.168.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.168.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.168.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.168.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.168.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.169.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.169.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.169.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.169.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.169.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.169.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.170.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.170.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.170.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.170.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.170.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.170.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.171.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.171.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.171.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.171.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.171.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.171.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.172.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.172.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.172.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.172.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.172.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.172.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.173.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.173.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.173.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.173.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.173.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.173.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.174.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.174.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.174.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.174.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.174.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.174.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.175.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.175.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.175.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.175.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.175.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.175.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.176.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.176.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.176.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.176.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.176.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.176.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.177.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.177.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.177.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.177.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.177.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.177.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.178.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.178.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.178.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.178.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.178.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.178.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.179.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.179.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.179.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.179.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.179.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.179.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.180.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.180.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.180.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.180.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.180.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.180.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.181.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.181.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.181.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.181.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.181.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.181.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.182.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.182.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.182.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.182.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.182.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.182.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.183.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.183.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.183.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.183.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.183.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.183.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.184.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.184.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.184.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.184.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.184.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.184.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.185.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.185.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.185.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.185.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.185.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.185.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.186.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.186.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.186.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.186.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.186.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.186.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.187.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.187.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.187.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.187.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.187.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.187.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.188.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.188.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.188.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.188.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.188.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.188.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.189.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.189.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.189.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.189.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.189.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.189.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.190.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.190.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.190.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.190.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.190.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.190.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.191.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.191.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.191.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.191.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.191.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.191.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.192.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.192.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.192.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.192.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.192.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.192.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.193.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.193.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.193.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.193.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.193.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.193.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.194.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.194.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.194.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.194.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.194.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.194.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.195.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.195.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.195.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.195.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.195.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.195.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.196.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.196.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.196.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.196.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.196.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.196.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.197.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.197.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.197.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.197.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.197.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.197.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.198.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.198.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.198.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.198.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.198.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.198.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.199.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.199.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.199.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.199.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.199.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.199.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.200.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.200.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.200.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.200.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.200.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.200.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.201.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.201.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.201.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.201.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.201.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.201.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.202.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.202.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.202.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.202.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.202.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.202.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.203.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.203.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.203.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.203.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.203.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.203.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.204.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.204.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.204.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.204.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.204.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.204.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.205.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.205.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.205.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.205.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.205.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.205.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.206.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.206.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.206.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.206.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.206.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.206.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.207.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.207.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.207.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.207.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.207.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.207.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.208.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.208.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.208.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.208.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.208.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.208.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.209.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.209.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.209.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.209.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.209.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.209.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.210.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.210.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.210.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.210.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.210.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.210.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.211.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.211.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.211.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.211.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.211.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.211.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.212.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.212.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.212.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.212.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.212.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.212.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.213.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.213.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.213.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.213.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.213.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.213.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.214.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.214.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.214.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.214.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.214.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.214.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.215.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.215.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.215.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.215.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.215.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.215.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.216.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.216.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.216.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.216.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.216.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.216.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.217.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.217.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.217.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.217.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.217.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.217.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.218.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.218.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.218.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.218.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.218.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.218.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.219.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.219.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.219.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.219.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.219.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.219.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.220.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.220.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.220.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.220.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.220.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.220.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.221.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.221.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.221.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.221.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.221.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.221.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.222.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.222.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.222.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.222.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.222.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.222.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.223.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.223.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.223.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.223.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.223.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.223.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.224.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.224.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.224.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.224.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.224.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.224.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.225.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.225.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.225.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.225.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.225.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.225.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.226.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.226.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.226.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.226.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.226.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.226.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.227.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.227.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.227.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.227.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.227.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.227.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.228.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.228.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.228.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.228.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.228.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.228.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.229.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.229.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.229.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.229.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.229.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.229.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.230.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.230.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.230.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.230.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.230.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.230.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.231.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.231.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.231.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.231.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.231.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.231.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.232.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.232.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.232.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.232.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.232.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.232.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.233.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.233.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.233.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.233.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.233.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.233.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.234.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.234.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.234.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.234.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.234.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.234.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.235.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.235.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.235.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.235.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.235.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.235.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.236.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.236.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.236.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.236.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.236.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.236.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.237.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.237.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.237.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.237.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.237.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.237.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.238.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.238.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.238.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.238.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.238.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.238.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.239.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.239.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.239.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.239.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.239.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.239.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.240.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.240.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.240.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.240.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.240.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.240.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.241.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.241.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.241.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.241.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.241.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.241.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.242.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.242.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.242.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.242.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.242.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.242.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.243.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.243.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.243.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.243.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.243.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.243.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.244.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.244.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.244.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.244.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.244.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.244.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.245.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.245.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.245.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.245.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.245.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.245.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.246.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.246.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.246.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.246.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.246.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.246.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.247.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.247.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.247.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.247.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.247.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.247.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.248.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.248.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.248.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.248.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.248.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.248.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.249.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.249.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.249.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.249.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.249.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.249.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.250.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.250.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.250.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.250.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.250.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.250.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.251.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.251.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.251.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.251.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.251.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.251.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.252.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.252.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.252.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.252.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.252.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.252.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.253.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.253.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.253.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.253.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.253.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.253.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.254.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.254.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.254.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.254.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.254.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.254.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.255.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.255.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.255.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.255.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.255.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.255.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.input_layernorm.weight": "model-00045-of-000163.safetensors", "model.layers.18.post_attention_layernorm.weight": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.q_a_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.self_attn.q_a_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.q_a_layernorm.weight": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.q_b_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.self_attn.q_b_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.kv_a_proj_with_mqa.weight": "model-00045-of-000163.safetensors", - "model.layers.19.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.kv_a_layernorm.weight": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.kv_b_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.self_attn.kv_b_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.o_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.self_attn.o_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.gate.weight": "model-00045-of-000163.safetensors", "model.layers.19.mlp.gate.e_score_correction_bias": "model-00045-of-000163.safetensors", "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.shared_experts.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.shared_experts.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.0.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.0.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.0.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.0.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.0.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.1.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.1.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.1.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.1.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.1.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.2.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.2.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.2.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.2.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.2.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.3.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.3.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.3.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.3.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.3.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.4.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.4.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.4.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.4.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.4.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.5.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.5.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.5.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.5.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.5.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.6.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.6.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.6.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.6.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.6.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.7.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.7.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.7.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.7.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.7.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.8.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.8.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.8.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.8.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.8.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.9.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.9.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.9.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.9.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.9.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.10.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.10.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.10.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.10.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.10.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.11.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.11.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.11.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.11.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.11.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.12.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.12.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.12.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.12.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.12.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.13.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.13.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.13.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.13.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.13.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.14.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.14.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.14.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.14.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.14.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.15.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.15.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.15.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.15.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.15.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.16.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.16.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.16.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.16.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.16.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.17.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.17.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.17.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.17.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.17.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.18.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.18.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.18.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.18.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.18.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.19.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.19.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.19.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.19.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.19.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.20.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.20.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.20.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.20.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.20.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.21.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.21.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.21.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.21.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.21.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.22.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.22.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.22.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.22.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.22.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.23.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.23.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.23.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.23.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.23.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.24.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.24.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.24.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.24.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.24.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.25.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.25.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.25.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.25.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.25.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.26.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.26.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.26.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.26.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.26.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.27.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.27.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.27.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.27.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.27.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.28.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.28.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.28.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.28.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.28.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.29.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.29.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.29.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.29.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.29.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.30.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.30.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.30.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.30.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.30.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.31.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.31.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.31.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.31.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.31.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.32.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.32.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.32.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.32.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.32.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.33.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.33.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.33.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.33.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.33.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.34.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.34.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.34.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.34.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.34.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.35.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.35.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.35.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.35.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.35.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.36.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.36.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.36.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.36.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.36.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.37.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.37.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.37.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.37.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.37.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.38.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.38.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.38.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.38.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.38.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.39.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.39.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.39.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.39.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.39.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.39.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.40.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.40.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.40.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.40.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.40.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.41.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.41.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.41.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.41.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.41.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.42.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.42.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.42.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.42.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.42.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.43.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.43.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.43.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.43.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.43.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.44.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.44.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.44.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.44.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.44.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.45.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.45.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.45.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.45.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.45.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.46.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.46.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.46.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.46.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.46.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.47.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.47.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.47.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.47.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.47.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.48.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.48.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.48.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.48.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.48.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.49.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.49.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.49.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.49.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.49.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.50.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.50.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.50.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.50.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.50.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.51.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.51.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.51.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.51.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.51.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.52.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.52.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.52.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.52.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.52.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.53.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.53.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.53.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.53.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.53.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.54.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.54.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.54.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.54.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.54.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.55.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.55.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.55.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.55.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.55.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.56.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.56.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.56.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.56.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.56.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.57.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.57.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.57.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.57.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.57.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.58.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.58.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.58.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.58.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.58.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.59.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.59.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.59.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.59.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.59.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.60.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.60.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.60.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.60.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.60.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.61.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.61.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.61.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.61.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.61.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.62.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.62.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.62.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.62.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.62.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.63.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.63.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.63.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.63.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.63.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.64.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.64.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.64.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.64.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.64.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.65.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.65.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.65.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.65.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.65.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.66.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.66.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.66.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.66.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.66.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.67.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.67.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.67.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.67.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.67.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.68.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.68.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.68.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.68.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.68.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.69.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.69.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.69.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.69.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.69.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.70.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.70.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.70.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.70.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.70.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.71.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.71.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.71.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.71.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.71.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.72.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.72.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.72.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.72.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.72.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.73.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.73.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.73.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.73.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.73.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.74.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.74.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.74.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.74.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.74.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.75.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.75.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.75.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.75.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.75.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.76.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.76.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.76.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.76.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.76.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.77.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.77.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.77.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.77.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.77.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.78.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.78.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.78.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.78.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.78.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.79.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.79.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.79.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.79.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.79.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.80.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.80.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.80.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.80.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.80.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.81.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.81.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.81.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.81.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.81.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.82.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.82.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.82.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.82.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.82.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.83.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.83.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.83.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.83.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.83.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.84.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.84.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.84.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.84.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.84.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.85.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.85.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.85.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.85.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.85.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.86.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.86.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.86.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.86.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.86.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.87.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.87.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.87.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.87.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.87.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.88.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.88.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.88.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.88.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.88.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.89.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.89.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.89.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.89.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.89.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.90.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.90.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.90.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.90.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.90.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.91.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.91.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.91.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.91.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.91.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.92.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.92.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.92.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.92.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.92.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.93.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.93.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.93.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.93.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.93.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.94.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.94.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.94.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.94.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.94.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.95.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.95.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.95.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.95.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.95.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.96.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.96.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.96.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.96.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.96.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.97.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.97.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.97.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.97.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.97.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.98.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.98.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.98.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.98.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.98.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.99.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.99.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.99.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.99.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.99.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.100.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.100.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.100.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.100.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.100.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.101.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.101.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.101.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.101.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.101.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.102.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.102.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.102.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.102.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.102.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.103.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.103.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.103.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.103.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.103.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.104.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.104.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.104.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.104.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.104.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.105.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.105.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.105.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.105.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.105.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.106.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.106.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.106.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.106.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.106.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.107.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.107.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.107.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.107.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.107.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.108.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.108.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.108.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.108.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.108.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.109.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.109.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.109.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.109.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.109.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.110.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.110.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.110.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.110.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.110.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.111.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.111.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.111.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.111.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.111.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.112.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.112.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.112.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.112.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.112.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.113.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.113.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.113.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.113.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.113.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.114.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.114.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.114.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.114.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.114.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.115.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.115.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.115.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.115.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.115.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.116.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.116.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.116.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.116.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.116.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.117.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.117.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.117.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.117.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.117.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.118.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.118.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.118.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.118.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.118.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.119.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.119.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.119.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.119.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.119.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.120.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.120.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.120.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.120.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.120.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.121.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.121.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.121.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.121.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.121.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.122.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.122.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.122.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.122.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.122.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.123.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.123.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.123.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.123.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.123.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.124.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.124.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.124.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.124.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.124.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.125.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.125.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.125.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.125.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.125.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.126.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.126.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.126.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.126.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.126.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.127.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.127.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.127.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.127.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.127.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.128.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.128.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.128.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.128.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.128.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.128.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.129.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.129.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.129.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.129.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.129.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.129.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.130.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.130.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.130.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.130.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.130.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.130.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.131.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.131.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.131.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.131.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.131.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.131.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.132.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.132.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.132.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.132.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.132.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.132.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.133.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.133.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.133.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.133.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.133.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.133.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.134.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.134.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.134.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.134.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.134.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.134.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.135.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.135.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.135.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.135.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.135.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.135.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.136.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.136.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.136.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.136.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.136.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.136.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.137.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.137.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.137.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.137.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.137.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.137.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.138.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.138.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.138.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.138.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.138.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.138.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.139.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.139.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.139.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.139.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.139.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.139.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.140.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.140.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.140.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.140.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.140.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.140.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.141.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.141.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.141.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.141.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.141.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.141.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.142.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.142.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.142.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.142.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.142.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.142.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.143.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.143.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.143.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.143.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.143.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.143.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.144.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.144.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.144.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.144.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.144.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.144.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.145.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.145.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.145.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.145.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.145.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.145.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.146.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.146.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.146.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.146.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.146.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.146.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.147.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.147.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.147.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.147.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.147.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.147.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.148.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.148.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.148.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.148.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.148.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.148.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.149.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.149.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.149.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.149.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.149.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.149.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.150.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.150.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.150.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.150.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.150.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.150.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.151.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.151.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.151.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.151.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.151.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.151.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.152.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.152.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.152.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.152.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.152.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.152.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.153.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.153.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.153.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.153.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.153.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.153.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.154.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.154.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.154.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.154.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.154.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.154.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.155.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.155.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.155.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.155.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.155.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.155.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.156.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.156.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.156.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.156.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.156.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.156.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.157.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.157.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.157.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.157.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.157.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.157.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.158.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.158.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.158.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.158.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.158.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.158.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.159.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.159.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.159.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.159.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.159.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.159.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.160.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.160.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.160.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.160.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.160.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.160.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.161.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.161.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.161.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.161.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.161.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.161.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.162.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.162.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.162.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.162.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.162.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.162.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.163.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.163.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.163.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.163.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.163.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.163.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.164.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.164.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.164.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.164.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.164.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.164.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.165.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.165.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.165.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.165.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.165.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.165.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.166.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.166.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.166.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.166.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.166.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.166.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.167.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.167.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.167.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.167.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.167.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.167.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.168.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.168.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.168.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.168.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.168.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.168.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.169.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.169.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.169.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.169.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.169.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.169.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.170.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.170.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.170.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.170.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.170.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.170.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.171.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.171.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.171.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.171.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.171.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.171.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.172.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.172.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.172.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.172.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.172.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.172.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.173.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.173.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.173.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.173.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.173.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.173.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.174.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.174.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.174.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.174.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.174.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.174.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.175.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.175.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.175.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.175.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.175.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.175.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.176.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.176.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.176.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.176.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.176.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.176.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.177.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.177.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.177.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.177.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.177.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.177.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.178.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.178.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.178.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.178.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.178.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.178.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.179.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.179.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.179.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.179.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.179.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.179.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.180.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.180.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.180.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.180.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.180.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.180.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.181.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.181.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.181.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.181.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.181.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.181.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.182.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.182.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.182.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.182.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.182.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.182.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.183.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.183.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.183.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.183.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.183.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.183.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.184.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.184.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.184.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.184.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.184.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.184.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.185.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.185.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.185.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.185.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.185.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.185.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.186.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.186.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.186.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.186.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.186.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.186.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.187.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.187.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.187.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.187.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.187.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.187.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.188.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.188.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.188.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.188.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.188.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.188.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.189.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.189.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.189.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.189.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.189.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.189.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.190.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.190.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.190.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.190.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.190.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.190.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.191.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.191.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.191.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.191.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.191.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.191.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.192.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.192.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.192.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.192.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.192.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.192.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.193.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.193.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.193.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.193.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.193.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.193.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.194.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.194.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.194.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.194.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.194.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.194.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.195.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.195.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.195.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.195.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.195.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.195.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.196.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.196.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.196.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.196.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.196.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.196.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.197.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.197.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.197.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.197.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.197.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.197.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.198.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.198.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.198.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.198.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.198.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.198.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.199.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.199.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.199.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.199.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.199.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.199.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.200.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.200.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.200.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.200.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.200.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.200.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.201.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.201.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.201.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.201.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.201.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.201.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.202.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.202.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.202.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.202.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.202.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.202.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.203.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.203.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.203.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.203.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.203.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.203.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.204.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.204.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.204.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.204.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.204.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.204.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.205.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.205.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.205.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.205.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.205.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.205.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.206.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.206.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.206.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.206.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.206.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.206.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.207.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.207.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.207.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.207.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.207.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.207.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.208.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.208.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.208.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.208.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.208.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.208.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.209.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.209.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.209.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.209.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.209.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.209.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.210.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.210.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.210.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.210.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.210.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.210.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.211.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.211.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.211.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.211.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.211.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.211.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.212.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.212.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.212.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.212.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.212.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.212.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.213.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.213.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.213.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.213.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.213.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.213.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.214.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.214.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.214.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.214.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.214.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.214.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.215.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.215.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.215.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.215.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.215.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.215.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.216.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.216.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.216.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.216.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.216.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.216.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.217.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.217.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.217.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.217.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.217.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.217.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.218.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.218.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.218.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.218.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.218.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.218.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.219.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.219.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.219.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.219.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.219.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.219.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.220.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.220.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.220.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.220.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.220.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.220.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.221.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.221.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.221.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.221.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.221.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.221.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.222.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.222.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.222.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.222.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.222.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.222.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.223.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.223.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.223.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.223.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.223.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.223.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.224.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.224.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.224.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.224.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.224.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.224.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.225.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.225.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.225.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.225.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.225.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.225.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.226.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.226.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.226.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.226.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.226.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.226.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.227.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.227.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.227.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.227.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.227.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.227.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.228.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.228.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.228.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.228.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.228.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.228.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.229.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.229.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.229.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.229.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.229.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.229.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.230.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.230.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.230.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.230.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.230.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.230.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.231.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.231.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.231.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.231.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.231.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.231.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.232.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.232.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.232.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.232.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.232.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.232.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.233.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.233.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.233.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.233.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.233.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.233.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.234.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.234.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.234.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.234.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.234.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.234.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.235.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.235.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.235.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.235.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.235.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.235.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.236.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.236.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.236.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.236.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.236.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.236.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.237.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.237.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.237.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.237.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.237.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.237.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.238.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.238.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.238.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.238.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.238.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.238.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.239.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.239.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.239.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.239.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.239.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.239.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.240.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.240.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.240.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.240.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.240.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.240.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.241.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.241.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.241.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.241.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.241.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.241.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.242.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.242.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.242.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.242.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.242.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.242.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.243.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.243.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.243.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.243.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.243.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.243.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.244.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.244.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.244.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.244.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.244.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.244.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.245.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.245.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.245.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.245.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.245.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.245.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.246.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.246.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.246.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.246.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.246.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.246.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.247.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.247.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.247.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.247.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.247.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.247.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.248.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.248.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.248.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.248.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.248.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.248.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.249.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.249.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.249.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.249.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.249.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.249.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.250.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.250.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.250.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.250.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.250.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.250.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.251.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.251.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.251.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.251.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.251.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.251.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.252.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.252.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.252.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.252.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.252.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.252.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.253.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.253.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.253.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.253.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.253.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.253.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.254.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.254.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.254.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.254.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.254.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.254.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.255.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.255.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.255.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.255.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.255.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.255.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.input_layernorm.weight": "model-00048-of-000163.safetensors", "model.layers.19.post_attention_layernorm.weight": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.q_a_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.self_attn.q_a_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.q_a_layernorm.weight": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.q_b_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.self_attn.q_b_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.kv_a_proj_with_mqa.weight": "model-00048-of-000163.safetensors", - "model.layers.20.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.kv_a_layernorm.weight": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.kv_b_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.self_attn.kv_b_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.o_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.self_attn.o_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.gate.weight": "model-00048-of-000163.safetensors", "model.layers.20.mlp.gate.e_score_correction_bias": "model-00048-of-000163.safetensors", "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.shared_experts.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.shared_experts.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.0.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.0.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.0.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.0.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.0.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.1.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.1.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.1.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.1.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.1.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.2.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.2.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.2.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.2.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.2.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.3.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.3.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.3.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.3.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.3.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.4.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.4.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.4.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.4.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.4.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.5.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.5.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.5.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.5.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.5.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.6.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.6.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.6.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.6.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.6.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.7.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.7.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.7.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.7.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.7.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.8.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.8.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.8.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.8.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.8.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.9.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.9.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.9.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.9.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.9.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.10.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.10.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.10.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.10.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.10.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.11.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.11.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.11.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.11.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.11.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.12.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.12.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.12.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.12.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.12.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.13.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.13.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.13.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.13.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.13.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.14.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.14.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.14.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.14.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.14.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.15.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.15.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.15.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.15.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.15.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.16.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.16.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.16.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.16.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.16.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.17.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.17.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.17.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.17.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.17.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.18.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.18.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.18.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.18.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.18.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.19.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.19.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.19.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.19.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.19.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.20.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.20.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.20.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.20.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.20.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.21.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.21.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.21.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.21.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.21.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.22.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.22.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.22.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.22.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.22.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.23.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.23.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.23.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.23.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.23.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.24.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.24.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.24.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.24.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.24.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.25.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.25.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.25.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.25.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.25.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.26.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.26.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.26.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.26.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.26.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.27.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.27.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.27.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.27.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.27.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.28.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.28.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.28.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.28.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.28.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.29.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.29.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.29.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.29.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.29.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.30.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.30.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.30.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.30.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.30.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.31.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.31.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.31.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.31.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.31.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.32.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.32.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.32.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.32.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.32.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.33.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.33.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.33.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.33.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.33.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.34.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.34.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.34.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.34.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.34.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.35.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.35.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.35.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.35.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.35.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.36.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.36.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.36.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.36.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.36.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.37.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.37.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.37.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.37.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.37.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.38.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.38.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.38.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.38.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.38.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.39.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.39.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.39.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.39.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.39.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.40.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.40.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.40.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.40.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.40.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.41.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.41.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.41.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.41.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.41.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.42.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.42.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.42.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.42.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.42.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.43.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.43.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.43.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.43.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.43.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.44.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.44.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.44.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.44.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.44.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.45.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.45.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.45.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.45.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.45.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.46.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.46.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.46.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.46.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.46.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.47.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.47.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.47.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.47.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.47.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.48.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.48.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.48.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.48.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.48.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.49.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.49.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.49.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.49.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.49.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.50.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.50.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.50.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.50.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.50.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.50.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.51.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.51.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.51.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.51.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.51.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.52.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.52.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.52.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.52.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.52.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.53.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.53.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.53.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.53.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.53.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.54.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.54.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.54.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.54.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.54.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.55.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.55.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.55.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.55.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.55.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.56.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.56.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.56.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.56.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.56.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.57.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.57.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.57.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.57.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.57.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.58.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.58.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.58.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.58.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.58.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.59.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.59.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.59.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.59.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.59.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.60.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.60.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.60.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.60.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.60.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.61.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.61.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.61.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.61.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.61.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.62.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.62.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.62.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.62.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.62.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.63.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.63.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.63.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.63.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.63.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.64.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.64.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.64.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.64.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.64.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.65.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.65.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.65.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.65.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.65.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.66.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.66.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.66.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.66.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.66.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.67.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.67.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.67.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.67.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.67.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.68.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.68.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.68.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.68.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.68.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.69.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.69.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.69.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.69.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.69.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.70.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.70.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.70.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.70.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.70.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.71.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.71.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.71.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.71.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.71.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.72.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.72.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.72.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.72.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.72.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.73.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.73.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.73.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.73.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.73.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.74.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.74.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.74.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.74.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.74.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.75.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.75.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.75.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.75.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.75.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.76.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.76.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.76.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.76.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.76.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.77.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.77.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.77.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.77.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.77.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.78.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.78.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.78.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.78.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.78.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.79.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.79.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.79.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.79.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.79.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.80.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.80.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.80.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.80.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.80.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.81.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.81.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.81.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.81.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.81.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.82.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.82.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.82.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.82.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.82.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.83.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.83.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.83.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.83.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.83.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.84.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.84.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.84.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.84.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.84.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.85.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.85.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.85.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.85.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.85.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.86.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.86.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.86.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.86.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.86.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.87.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.87.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.87.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.87.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.87.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.88.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.88.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.88.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.88.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.88.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.89.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.89.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.89.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.89.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.89.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.90.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.90.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.90.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.90.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.90.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.91.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.91.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.91.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.91.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.91.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.92.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.92.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.92.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.92.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.92.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.93.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.93.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.93.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.93.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.93.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.94.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.94.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.94.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.94.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.94.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.95.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.95.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.95.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.95.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.95.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.95.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.96.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.96.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.96.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.96.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.96.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.97.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.97.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.97.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.97.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.97.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.98.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.98.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.98.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.98.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.98.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.99.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.99.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.99.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.99.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.99.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.100.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.100.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.100.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.100.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.100.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.101.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.101.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.101.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.101.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.101.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.102.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.102.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.102.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.102.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.102.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.103.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.103.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.103.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.103.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.103.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.104.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.104.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.104.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.104.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.104.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.105.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.105.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.105.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.105.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.105.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.106.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.106.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.106.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.106.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.106.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.106.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.107.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.107.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.107.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.107.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.107.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.108.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.108.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.108.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.108.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.108.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.109.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.109.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.109.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.109.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.109.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.110.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.110.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.110.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.110.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.110.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.111.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.111.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.111.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.111.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.111.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.112.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.112.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.112.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.112.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.112.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.113.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.113.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.113.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.113.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.113.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.113.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.114.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.114.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.114.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.114.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.114.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.115.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.115.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.115.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.115.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.115.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.116.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.116.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.116.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.116.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.116.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.117.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.117.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.117.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.117.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.117.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.118.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.118.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.118.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.118.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.118.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.119.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.119.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.119.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.119.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.119.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.120.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.120.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.120.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.120.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.120.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.121.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.121.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.121.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.121.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.121.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.122.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.122.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.122.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.122.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.122.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.123.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.123.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.123.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.123.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.123.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.124.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.124.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.124.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.124.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.124.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.125.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.125.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.125.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.125.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.125.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.126.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.126.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.126.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.126.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.126.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.127.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.127.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.127.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.127.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.127.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.128.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.128.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.128.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.128.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.128.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.128.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.129.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.129.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.129.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.129.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.129.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.129.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.130.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.130.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.130.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.130.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.130.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.130.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.131.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.131.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.131.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.131.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.131.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.131.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.132.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.132.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.132.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.132.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.132.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.132.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.133.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.133.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.133.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.133.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.133.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.133.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.134.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.134.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.134.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.134.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.134.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.134.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.135.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.135.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.135.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.135.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.135.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.135.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.136.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.136.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.136.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.136.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.136.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.136.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.137.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.137.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.137.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.137.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.137.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.137.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.138.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.138.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.138.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.138.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.138.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.138.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.139.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.139.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.139.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.139.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.139.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.139.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.140.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.140.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.140.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.140.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.140.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.140.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.141.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.141.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.141.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.141.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.141.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.141.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.142.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.142.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.142.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.142.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.142.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.142.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.143.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.143.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.143.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.143.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.143.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.143.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.144.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.144.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.144.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.144.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.144.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.144.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.145.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.145.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.145.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.145.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.145.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.145.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.146.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.146.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.146.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.146.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.146.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.146.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.147.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.147.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.147.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.147.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.147.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.147.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.148.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.148.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.148.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.148.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.148.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.148.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.149.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.149.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.149.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.149.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.149.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.149.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.150.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.150.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.150.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.150.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.150.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.150.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.151.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.151.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.151.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.151.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.151.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.151.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.152.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.152.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.152.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.152.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.152.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.152.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.153.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.153.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.153.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.153.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.153.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.153.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.154.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.154.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.154.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.154.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.154.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.154.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.155.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.155.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.155.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.155.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.155.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.155.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.156.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.156.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.156.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.156.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.156.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.156.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.157.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.157.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.157.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.157.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.157.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.157.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.158.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.158.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.158.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.158.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.158.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.158.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.159.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.159.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.159.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.159.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.159.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.159.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.160.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.160.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.160.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.160.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.160.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.160.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.161.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.161.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.161.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.161.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.161.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.161.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.162.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.162.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.162.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.162.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.162.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.162.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.163.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.163.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.163.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.163.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.163.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.163.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.164.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.164.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.164.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.164.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.164.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.164.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.165.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.165.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.165.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.165.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.165.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.165.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.166.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.166.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.166.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.166.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.166.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.166.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.167.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.167.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.167.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.167.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.167.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.167.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.168.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.168.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.168.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.168.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.168.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.168.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.169.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.169.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.169.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.169.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.169.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.169.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.170.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.170.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.170.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.170.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.170.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.170.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.171.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.171.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.171.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.171.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.171.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.171.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.172.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.172.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.172.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.172.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.172.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.172.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.173.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.173.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.173.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.173.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.173.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.173.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.174.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.174.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.174.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.174.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.174.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.174.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.175.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.175.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.175.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.175.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.175.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.175.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.176.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.176.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.176.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.176.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.176.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.176.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.177.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.177.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.177.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.177.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.177.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.177.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.178.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.178.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.178.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.178.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.178.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.178.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.179.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.179.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.179.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.179.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.179.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.179.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.180.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.180.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.180.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.180.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.180.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.180.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.181.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.181.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.181.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.181.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.181.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.181.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.182.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.182.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.182.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.182.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.182.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.182.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.183.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.183.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.183.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.183.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.183.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.183.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.184.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.184.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.184.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.184.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.184.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.184.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.185.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.185.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.185.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.185.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.185.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.185.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.186.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.186.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.186.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.186.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.186.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.186.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.187.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.187.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.187.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.187.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.187.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.187.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.188.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.188.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.188.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.188.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.188.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.188.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.189.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.189.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.189.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.189.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.189.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.189.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.190.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.190.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.190.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.190.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.190.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.190.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.191.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.191.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.191.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.191.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.191.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.191.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.192.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.192.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.192.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.192.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.192.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.192.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.193.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.193.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.193.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.193.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.193.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.193.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.194.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.194.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.194.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.194.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.194.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.194.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.195.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.195.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.195.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.195.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.195.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.195.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.196.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.196.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.196.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.196.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.196.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.196.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.197.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.197.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.197.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.197.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.197.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.197.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.198.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.198.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.198.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.198.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.198.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.198.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.199.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.199.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.199.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.199.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.199.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.199.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.200.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.200.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.200.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.200.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.200.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.200.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.201.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.201.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.201.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.201.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.201.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.201.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.202.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.202.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.202.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.202.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.202.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.202.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.203.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.203.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.203.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.203.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.203.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.203.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.204.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.204.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.204.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.204.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.204.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.204.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.205.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.205.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.205.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.205.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.205.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.205.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.206.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.206.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.206.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.206.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.206.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.206.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.207.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.207.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.207.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.207.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.207.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.207.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.208.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.208.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.208.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.208.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.208.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.208.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.209.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.209.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.209.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.209.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.209.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.209.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.210.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.210.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.210.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.210.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.210.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.210.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.211.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.211.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.211.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.211.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.211.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.211.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.212.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.212.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.212.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.212.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.212.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.212.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.213.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.213.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.213.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.213.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.213.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.213.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.214.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.214.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.214.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.214.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.214.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.214.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.215.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.215.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.215.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.215.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.215.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.215.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.216.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.216.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.216.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.216.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.216.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.216.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.217.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.217.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.217.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.217.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.217.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.217.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.218.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.218.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.218.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.218.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.218.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.218.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.219.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.219.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.219.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.219.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.219.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.219.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.220.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.220.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.220.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.220.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.220.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.220.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.221.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.221.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.221.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.221.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.221.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.221.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.222.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.222.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.222.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.222.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.222.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.222.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.223.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.223.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.223.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.223.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.223.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.223.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.224.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.224.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.224.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.224.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.224.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.224.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.225.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.225.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.225.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.225.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.225.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.225.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.226.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.226.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.226.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.226.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.226.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.226.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.227.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.227.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.227.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.227.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.227.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.227.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.228.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.228.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.228.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.228.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.228.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.228.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.229.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.229.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.229.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.229.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.229.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.229.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.230.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.230.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.230.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.230.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.230.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.230.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.231.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.231.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.231.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.231.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.231.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.231.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.232.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.232.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.232.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.232.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.232.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.232.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.233.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.233.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.233.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.233.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.233.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.233.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.234.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.234.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.234.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.234.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.234.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.234.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.235.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.235.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.235.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.235.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.235.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.235.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.236.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.236.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.236.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.236.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.236.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.236.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.237.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.237.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.237.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.237.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.237.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.237.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.238.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.238.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.238.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.238.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.238.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.238.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.239.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.239.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.239.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.239.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.239.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.239.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.240.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.240.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.240.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.240.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.240.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.240.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.241.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.241.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.241.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.241.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.241.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.241.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.242.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.242.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.242.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.242.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.242.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.242.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.243.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.243.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.243.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.243.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.243.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.243.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.244.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.244.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.244.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.244.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.244.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.244.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.245.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.245.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.245.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.245.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.245.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.245.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.246.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.246.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.246.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.246.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.246.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.246.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.247.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.247.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.247.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.247.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.247.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.247.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.248.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.248.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.248.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.248.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.248.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.248.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.249.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.249.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.249.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.249.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.249.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.249.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.250.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.250.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.250.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.250.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.250.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.250.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.251.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.251.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.251.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.251.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.251.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.251.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.252.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.252.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.252.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.252.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.252.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.252.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.253.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.253.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.253.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.253.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.253.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.253.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.254.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.254.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.254.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.254.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.254.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.254.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.255.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.255.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.255.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.255.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.255.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.255.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.input_layernorm.weight": "model-00051-of-000163.safetensors", "model.layers.20.post_attention_layernorm.weight": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.q_a_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.self_attn.q_a_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.q_a_layernorm.weight": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.q_b_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.self_attn.q_b_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.kv_a_proj_with_mqa.weight": "model-00051-of-000163.safetensors", - "model.layers.21.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.kv_a_layernorm.weight": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.kv_b_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.self_attn.kv_b_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.o_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.self_attn.o_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.gate.weight": "model-00051-of-000163.safetensors", "model.layers.21.mlp.gate.e_score_correction_bias": "model-00051-of-000163.safetensors", "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.shared_experts.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.shared_experts.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.0.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.0.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.0.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.0.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.0.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.1.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.1.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.1.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.1.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.1.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.2.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.2.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.2.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.2.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.2.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.3.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.3.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.3.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.3.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.3.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.4.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.4.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.4.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.4.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.4.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.5.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.5.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.5.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.5.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.5.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.6.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.6.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.6.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.6.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.6.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.7.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.7.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.7.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.7.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.7.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.8.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.8.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.8.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.8.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.8.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.9.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.9.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.9.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.9.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.9.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.10.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.10.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.10.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.10.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.10.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.11.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.11.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.11.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.11.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.11.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.12.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.12.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.12.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.12.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.12.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.13.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.13.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.13.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.13.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.13.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.14.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.14.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.14.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.14.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.14.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.15.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.15.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.15.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.15.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.15.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.16.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.16.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.16.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.16.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.16.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.17.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.17.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.17.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.17.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.17.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.17.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.18.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.18.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.18.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.18.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.18.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.19.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.19.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.19.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.19.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.19.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.20.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.20.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.20.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.20.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.20.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.21.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.21.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.21.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.21.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.21.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.22.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.22.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.22.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.22.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.22.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.23.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.23.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.23.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.23.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.23.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.24.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.24.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.24.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.24.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.24.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.25.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.25.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.25.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.25.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.25.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.26.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.26.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.26.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.26.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.26.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.27.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.27.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.27.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.27.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.27.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.28.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.28.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.28.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.28.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.28.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.29.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.29.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.29.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.29.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.29.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.30.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.30.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.30.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.30.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.30.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.31.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.31.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.31.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.31.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.31.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.32.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.32.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.32.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.32.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.32.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.33.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.33.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.33.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.33.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.33.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.34.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.34.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.34.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.34.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.34.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.35.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.35.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.35.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.35.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.35.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.36.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.36.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.36.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.36.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.36.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.37.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.37.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.37.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.37.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.37.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.38.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.38.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.38.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.38.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.38.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.39.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.39.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.39.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.39.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.39.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.40.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.40.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.40.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.40.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.40.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.41.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.41.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.41.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.41.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.41.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.42.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.42.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.42.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.42.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.42.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.43.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.43.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.43.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.43.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.43.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.44.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.44.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.44.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.44.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.44.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.45.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.45.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.45.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.45.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.45.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.46.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.46.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.46.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.46.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.46.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.47.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.47.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.47.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.47.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.47.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.48.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.48.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.48.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.48.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.48.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.49.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.49.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.49.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.49.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.49.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.50.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.50.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.50.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.50.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.50.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.51.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.51.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.51.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.51.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.51.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.52.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.52.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.52.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.52.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.52.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.53.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.53.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.53.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.53.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.53.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.54.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.54.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.54.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.54.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.54.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.55.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.55.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.55.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.55.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.55.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.56.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.56.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.56.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.56.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.56.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.57.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.57.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.57.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.57.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.57.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.58.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.58.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.58.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.58.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.58.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.59.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.59.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.59.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.59.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.59.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.60.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.60.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.60.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.60.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.60.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.61.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.61.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.61.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.61.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.61.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.62.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.62.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.62.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.62.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.62.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.63.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.63.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.63.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.63.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.63.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.64.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.64.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.64.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.64.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.64.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.65.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.65.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.65.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.65.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.65.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.66.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.66.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.66.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.66.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.66.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.67.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.67.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.67.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.67.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.67.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.68.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.68.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.68.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.68.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.68.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.69.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.69.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.69.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.69.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.69.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.70.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.70.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.70.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.70.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.70.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.71.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.71.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.71.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.71.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.71.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.72.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.72.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.72.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.72.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.72.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.73.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.73.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.73.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.73.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.73.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.74.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.74.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.74.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.74.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.74.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.75.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.75.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.75.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.75.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.75.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.76.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.76.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.76.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.76.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.76.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.77.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.77.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.77.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.77.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.77.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.78.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.78.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.78.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.78.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.78.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.79.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.79.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.79.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.79.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.79.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.80.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.80.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.80.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.80.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.80.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.81.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.81.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.81.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.81.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.81.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.82.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.82.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.82.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.82.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.82.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.83.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.83.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.83.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.83.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.83.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.84.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.84.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.84.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.84.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.84.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.85.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.85.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.85.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.85.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.85.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.86.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.86.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.86.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.86.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.86.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.87.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.87.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.87.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.87.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.87.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.88.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.88.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.88.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.88.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.88.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.89.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.89.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.89.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.89.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.89.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.90.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.90.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.90.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.90.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.90.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.91.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.91.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.91.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.91.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.91.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.92.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.92.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.92.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.92.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.92.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.93.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.93.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.93.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.93.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.93.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.94.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.94.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.94.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.94.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.94.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.95.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.95.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.95.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.95.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.95.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.96.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.96.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.96.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.96.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.96.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.97.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.97.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.97.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.97.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.97.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.98.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.98.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.98.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.98.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.98.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.99.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.99.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.99.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.99.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.99.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.100.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.100.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.100.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.100.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.100.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.101.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.101.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.101.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.101.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.101.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.102.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.102.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.102.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.102.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.102.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.103.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.103.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.103.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.103.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.103.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.104.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.104.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.104.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.104.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.104.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.105.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.105.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.105.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.105.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.105.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.106.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.106.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.106.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.106.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.106.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.107.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.107.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.107.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.107.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.107.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.108.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.108.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.108.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.108.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.108.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.109.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.109.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.109.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.109.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.109.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.110.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.110.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.110.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.110.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.110.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.111.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.111.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.111.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.111.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.111.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.112.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.112.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.112.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.112.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.112.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.113.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.113.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.113.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.113.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.113.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.114.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.114.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.114.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.114.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.114.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.115.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.115.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.115.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.115.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.115.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.116.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.116.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.116.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.116.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.116.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.117.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.117.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.117.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.117.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.117.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.118.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.118.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.118.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.118.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.118.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.118.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.119.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.119.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.119.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.119.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.119.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.120.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.120.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.120.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.120.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.120.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.121.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.121.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.121.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.121.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.121.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.122.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.122.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.122.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.122.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.122.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.123.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.123.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.123.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.123.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.123.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.124.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.124.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.124.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.124.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.124.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.125.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.125.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.125.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.125.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.125.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.126.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.126.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.126.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.126.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.126.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.127.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.127.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.127.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.127.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.127.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.128.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.128.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.128.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.128.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.128.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.128.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.129.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.129.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.129.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.129.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.129.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.129.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.130.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.130.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.130.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.130.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.130.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.130.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.131.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.131.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.131.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.131.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.131.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.131.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.132.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.132.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.132.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.132.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.132.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.132.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.133.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.133.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.133.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.133.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.133.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.133.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.134.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.134.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.134.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.134.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.134.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.134.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.135.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.135.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.135.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.135.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.135.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.135.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.136.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.136.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.136.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.136.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.136.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.136.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.137.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.137.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.137.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.137.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.137.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.137.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.138.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.138.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.138.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.138.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.138.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.138.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.139.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.139.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.139.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.139.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.139.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.139.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.140.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.140.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.140.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.140.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.140.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.140.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.141.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.141.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.141.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.141.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.141.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.141.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.142.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.142.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.142.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.142.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.142.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.142.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.143.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.143.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.143.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.143.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.143.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.143.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.144.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.144.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.144.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.144.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.144.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.144.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.145.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.145.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.145.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.145.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.145.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.145.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.146.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.146.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.146.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.146.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.146.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.146.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.147.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.147.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.147.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.147.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.147.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.147.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.148.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.148.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.148.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.148.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.148.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.148.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.149.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.149.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.149.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.149.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.149.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.149.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.150.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.150.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.150.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.150.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.150.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.150.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.151.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.151.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.151.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.151.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.151.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.151.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.152.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.152.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.152.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.152.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.152.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.152.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.153.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.153.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.153.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.153.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.153.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.153.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.154.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.154.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.154.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.154.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.154.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.154.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.155.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.155.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.155.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.155.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.155.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.155.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.156.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.156.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.156.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.156.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.156.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.156.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.157.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.157.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.157.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.157.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.157.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.157.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.158.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.158.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.158.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.158.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.158.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.158.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.159.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.159.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.159.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.159.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.159.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.159.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.160.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.160.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.160.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.160.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.160.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.160.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.161.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.161.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.161.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.161.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.161.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.161.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.162.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.162.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.162.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.162.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.162.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.162.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.163.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.163.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.163.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.163.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.163.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.163.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.164.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.164.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.164.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.164.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.164.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.164.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.165.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.165.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.165.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.165.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.165.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.165.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.166.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.166.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.166.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.166.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.166.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.166.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.167.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.167.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.167.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.167.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.167.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.167.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.168.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.168.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.168.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.168.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.168.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.168.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.169.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.169.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.169.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.169.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.169.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.169.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.170.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.170.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.170.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.170.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.170.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.170.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.171.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.171.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.171.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.171.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.171.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.171.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.172.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.172.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.172.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.172.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.172.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.172.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.173.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.173.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.173.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.173.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.173.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.173.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.174.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.174.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.174.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.174.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.174.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.174.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.175.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.175.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.175.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.175.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.175.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.175.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.176.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.176.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.176.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.176.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.176.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.176.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.177.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.177.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.177.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.177.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.177.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.177.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.178.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.178.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.178.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.178.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.178.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.178.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.179.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.179.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.179.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.179.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.179.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.179.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.180.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.180.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.180.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.180.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.180.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.180.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.181.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.181.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.181.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.181.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.181.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.181.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.182.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.182.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.182.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.182.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.182.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.182.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.183.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.183.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.183.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.183.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.183.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.183.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.184.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.184.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.184.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.184.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.184.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.184.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.185.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.185.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.185.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.185.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.185.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.185.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.186.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.186.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.186.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.186.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.186.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.186.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.187.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.187.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.187.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.187.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.187.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.187.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.188.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.188.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.188.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.188.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.188.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.188.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.189.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.189.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.189.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.189.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.189.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.189.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.190.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.190.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.190.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.190.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.190.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.190.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.191.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.191.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.191.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.191.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.191.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.191.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.192.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.192.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.192.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.192.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.192.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.192.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.193.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.193.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.193.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.193.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.193.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.193.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.194.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.194.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.194.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.194.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.194.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.194.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.195.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.195.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.195.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.195.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.195.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.195.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.196.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.196.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.196.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.196.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.196.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.196.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.197.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.197.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.197.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.197.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.197.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.197.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.198.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.198.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.198.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.198.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.198.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.198.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.199.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.199.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.199.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.199.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.199.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.199.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.200.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.200.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.200.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.200.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.200.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.200.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.201.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.201.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.201.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.201.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.201.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.201.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.202.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.202.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.202.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.202.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.202.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.202.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.203.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.203.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.203.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.203.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.203.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.203.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.204.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.204.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.204.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.204.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.204.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.204.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.205.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.205.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.205.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.205.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.205.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.205.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.206.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.206.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.206.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.206.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.206.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.206.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.207.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.207.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.207.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.207.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.207.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.207.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.208.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.208.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.208.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.208.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.208.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.208.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.209.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.209.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.209.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.209.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.209.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.209.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.210.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.210.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.210.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.210.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.210.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.210.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.211.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.211.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.211.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.211.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.211.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.211.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.212.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.212.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.212.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.212.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.212.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.212.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.213.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.213.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.213.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.213.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.213.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.213.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.214.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.214.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.214.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.214.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.214.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.214.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.215.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.215.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.215.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.215.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.215.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.215.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.216.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.216.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.216.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.216.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.216.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.216.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.217.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.217.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.217.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.217.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.217.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.217.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.218.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.218.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.218.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.218.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.218.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.218.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.219.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.219.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.219.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.219.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.219.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.219.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.220.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.220.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.220.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.220.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.220.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.220.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.221.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.221.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.221.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.221.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.221.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.221.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.222.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.222.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.222.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.222.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.222.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.222.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.223.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.223.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.223.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.223.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.223.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.223.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.224.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.224.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.224.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.224.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.224.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.224.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.225.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.225.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.225.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.225.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.225.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.225.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.226.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.226.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.226.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.226.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.226.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.226.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.227.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.227.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.227.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.227.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.227.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.227.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.228.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.228.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.228.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.228.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.228.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.228.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.229.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.229.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.229.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.229.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.229.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.229.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.230.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.230.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.230.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.230.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.230.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.230.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.231.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.231.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.231.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.231.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.231.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.231.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.232.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.232.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.232.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.232.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.232.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.232.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.233.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.233.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.233.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.233.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.233.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.233.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.234.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.234.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.234.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.234.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.234.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.234.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.235.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.235.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.235.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.235.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.235.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.235.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.236.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.236.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.236.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.236.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.236.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.236.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.237.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.237.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.237.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.237.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.237.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.237.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.238.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.238.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.238.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.238.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.238.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.238.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.239.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.239.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.239.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.239.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.239.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.239.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.240.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.240.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.240.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.240.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.240.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.240.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.241.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.241.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.241.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.241.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.241.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.241.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.242.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.242.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.242.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.242.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.242.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.242.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.243.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.243.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.243.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.243.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.243.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.243.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.244.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.244.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.244.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.244.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.244.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.244.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.245.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.245.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.245.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.245.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.245.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.245.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.246.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.246.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.246.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.246.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.246.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.246.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.247.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.247.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.247.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.247.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.247.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.247.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.248.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.248.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.248.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.248.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.248.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.248.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.249.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.249.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.249.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.249.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.249.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.249.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.250.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.250.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.250.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.250.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.250.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.250.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.251.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.251.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.251.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.251.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.251.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.251.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.252.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.252.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.252.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.252.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.252.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.252.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.253.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.253.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.253.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.253.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.253.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.253.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.254.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.254.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.254.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.254.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.254.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.254.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.255.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.255.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.255.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.255.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.255.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.255.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.input_layernorm.weight": "model-00053-of-000163.safetensors", "model.layers.21.post_attention_layernorm.weight": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.q_a_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.self_attn.q_a_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.q_a_layernorm.weight": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.q_b_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.self_attn.q_b_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.kv_a_proj_with_mqa.weight": "model-00053-of-000163.safetensors", - "model.layers.22.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.kv_a_layernorm.weight": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.kv_b_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.self_attn.kv_b_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.o_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.self_attn.o_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.gate.weight": "model-00053-of-000163.safetensors", "model.layers.22.mlp.gate.e_score_correction_bias": "model-00053-of-000163.safetensors", "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.shared_experts.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.shared_experts.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.shared_experts.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.0.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.0.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.0.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.0.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.0.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.1.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.1.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.1.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.1.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.1.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.2.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.2.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.2.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.2.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.2.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.3.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.3.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.3.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.3.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.3.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.4.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.4.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.4.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.4.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.4.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.5.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.5.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.5.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.5.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.5.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.6.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.6.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.6.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.6.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.6.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.7.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.7.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.7.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.7.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.7.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.8.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.8.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.8.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.8.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.8.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.9.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.9.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.9.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.9.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.9.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.10.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.10.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.10.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.10.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.10.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.11.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.11.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.11.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.11.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.11.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.12.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.12.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.12.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.12.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.12.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.13.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.13.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.13.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.13.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.13.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.14.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.14.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.14.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.14.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.14.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.15.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.15.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.15.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.15.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.15.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.16.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.16.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.16.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.16.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.16.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.17.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.17.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.17.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.17.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.17.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.18.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.18.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.18.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.18.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.18.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.18.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.19.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.19.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.19.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.19.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.19.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.20.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.20.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.20.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.20.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.20.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.21.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.21.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.21.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.21.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.21.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.22.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.22.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.22.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.22.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.22.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.23.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.23.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.23.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.23.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.23.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.24.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.24.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.24.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.24.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.24.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.25.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.25.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.25.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.25.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.25.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.26.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.26.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.26.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.26.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.26.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.27.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.27.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.27.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.27.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.27.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.28.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.28.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.28.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.28.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.28.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.28.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.29.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.29.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.29.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.29.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.29.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.30.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.30.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.30.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.30.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.30.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.31.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.31.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.31.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.31.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.31.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.32.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.32.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.32.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.32.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.32.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.33.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.33.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.33.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.33.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.33.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.34.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.34.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.34.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.34.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.34.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.35.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.35.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.35.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.35.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.35.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.36.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.36.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.36.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.36.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.36.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.37.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.37.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.37.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.37.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.37.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.38.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.38.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.38.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.38.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.38.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.39.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.39.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.39.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.39.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.39.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.39.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.40.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.40.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.40.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.40.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.40.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.41.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.41.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.41.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.41.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.41.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.42.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.42.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.42.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.42.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.42.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.43.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.43.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.43.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.43.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.43.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.44.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.44.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.44.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.44.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.44.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.45.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.45.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.45.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.45.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.45.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.46.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.46.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.46.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.46.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.46.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.47.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.47.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.47.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.47.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.47.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.48.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.48.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.48.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.48.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.48.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.49.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.49.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.49.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.49.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.49.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.50.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.50.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.50.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.50.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.50.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.51.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.51.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.51.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.51.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.51.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.52.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.52.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.52.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.52.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.52.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.53.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.53.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.53.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.53.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.53.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.54.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.54.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.54.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.54.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.54.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.55.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.55.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.55.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.55.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.55.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.56.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.56.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.56.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.56.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.56.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.57.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.57.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.57.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.57.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.57.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.58.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.58.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.58.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.58.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.58.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.59.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.59.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.59.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.59.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.59.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.60.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.60.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.60.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.60.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.60.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.61.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.61.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.61.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.61.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.61.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.62.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.62.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.62.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.62.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.62.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.63.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.63.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.63.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.63.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.63.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.64.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.64.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.64.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.64.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.64.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.65.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.65.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.65.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.65.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.65.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.66.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.66.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.66.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.66.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.66.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.67.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.67.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.67.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.67.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.67.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.67.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.68.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.68.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.68.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.68.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.68.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.69.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.69.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.69.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.69.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.69.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.70.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.70.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.70.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.70.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.70.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.71.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.71.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.71.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.71.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.71.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.72.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.72.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.72.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.72.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.72.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.73.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.73.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.73.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.73.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.73.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.74.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.74.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.74.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.74.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.74.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.75.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.75.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.75.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.75.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.75.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.76.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.76.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.76.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.76.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.76.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.77.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.77.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.77.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.77.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.77.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.78.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.78.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.78.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.78.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.78.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.79.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.79.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.79.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.79.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.79.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.80.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.80.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.80.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.80.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.80.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.81.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.81.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.81.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.81.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.81.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.82.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.82.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.82.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.82.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.82.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.83.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.83.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.83.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.83.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.83.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.84.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.84.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.84.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.84.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.84.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.85.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.85.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.85.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.85.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.85.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.86.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.86.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.86.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.86.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.86.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.87.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.87.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.87.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.87.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.87.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.88.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.88.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.88.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.88.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.88.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.89.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.89.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.89.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.89.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.89.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.90.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.90.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.90.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.90.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.90.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.91.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.91.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.91.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.91.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.91.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.92.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.92.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.92.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.92.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.92.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.93.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.93.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.93.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.93.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.93.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.94.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.94.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.94.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.94.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.94.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.95.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.95.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.95.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.95.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.95.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.96.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.96.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.96.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.96.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.96.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.97.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.97.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.97.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.97.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.97.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.98.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.98.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.98.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.98.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.98.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.99.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.99.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.99.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.99.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.99.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.100.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.100.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.100.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.100.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.100.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.101.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.101.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.101.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.101.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.101.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.102.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.102.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.102.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.102.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.102.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.103.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.103.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.103.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.103.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.103.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.104.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.104.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.104.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.104.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.104.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.105.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.105.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.105.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.105.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.105.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.106.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.106.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.106.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.106.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.106.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.107.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.107.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.107.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.107.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.107.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.108.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.108.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.108.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.108.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.108.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.109.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.109.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.109.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.109.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.109.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.110.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.110.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.110.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.110.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.110.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.111.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.111.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.111.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.111.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.111.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.112.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.112.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.112.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.112.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.112.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.113.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.113.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.113.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.113.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.113.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.114.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.114.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.114.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.114.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.114.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.115.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.115.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.115.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.115.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.115.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.116.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.116.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.116.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.116.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.116.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.116.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.117.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.117.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.117.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.117.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.117.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.118.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.118.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.118.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.118.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.118.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.119.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.119.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.119.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.119.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.119.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.120.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.120.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.120.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.120.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.120.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.121.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.121.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.121.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.121.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.121.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.122.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.122.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.122.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.122.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.122.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.123.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.123.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.123.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.123.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.123.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.124.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.124.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.124.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.124.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.124.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.125.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.125.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.125.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.125.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.125.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.126.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.126.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.126.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.126.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.126.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.127.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.127.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.127.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.127.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.127.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.128.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.128.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.128.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.128.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.128.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.128.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.129.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.129.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.129.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.129.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.129.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.129.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.130.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.130.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.130.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.130.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.130.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.130.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.131.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.131.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.131.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.131.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.131.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.131.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.132.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.132.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.132.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.132.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.132.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.132.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.133.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.133.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.133.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.133.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.133.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.133.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.134.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.134.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.134.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.134.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.134.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.134.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.135.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.135.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.135.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.135.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.135.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.135.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.136.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.136.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.136.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.136.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.136.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.136.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.137.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.137.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.137.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.137.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.137.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.137.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.138.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.138.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.138.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.138.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.138.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.138.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.139.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.139.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.139.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.139.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.139.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.139.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.140.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.140.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.140.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.140.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.140.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.140.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.141.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.141.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.141.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.141.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.141.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.141.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.142.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.142.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.142.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.142.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.142.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.142.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.143.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.143.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.143.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.143.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.143.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.143.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.144.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.144.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.144.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.144.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.144.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.144.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.145.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.145.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.145.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.145.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.145.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.145.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.146.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.146.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.146.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.146.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.146.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.146.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.147.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.147.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.147.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.147.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.147.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.147.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.148.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.148.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.148.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.148.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.148.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.148.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.149.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.149.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.149.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.149.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.149.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.149.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.150.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.150.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.150.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.150.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.150.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.150.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.151.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.151.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.151.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.151.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.151.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.151.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.152.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.152.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.152.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.152.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.152.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.152.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.153.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.153.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.153.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.153.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.153.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.153.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.154.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.154.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.154.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.154.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.154.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.154.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.155.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.155.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.155.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.155.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.155.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.155.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.156.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.156.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.156.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.156.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.156.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.156.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.157.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.157.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.157.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.157.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.157.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.157.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.158.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.158.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.158.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.158.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.158.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.158.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.159.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.159.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.159.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.159.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.159.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.159.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.160.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.160.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.160.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.160.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.160.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.160.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.161.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.161.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.161.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.161.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.161.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.161.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.162.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.162.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.162.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.162.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.162.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.162.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.163.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.163.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.163.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.163.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.163.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.163.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.164.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.164.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.164.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.164.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.164.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.164.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.165.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.165.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.165.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.165.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.165.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.165.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.166.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.166.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.166.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.166.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.166.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.166.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.167.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.167.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.167.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.167.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.167.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.167.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.168.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.168.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.168.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.168.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.168.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.168.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.169.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.169.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.169.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.169.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.169.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.169.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.170.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.170.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.170.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.170.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.170.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.170.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.171.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.171.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.171.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.171.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.171.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.171.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.172.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.172.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.172.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.172.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.172.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.172.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.173.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.173.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.173.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.173.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.173.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.173.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.174.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.174.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.174.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.174.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.174.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.174.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.175.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.175.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.175.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.175.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.175.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.175.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.176.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.176.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.176.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.176.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.176.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.176.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.177.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.177.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.177.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.177.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.177.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.177.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.178.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.178.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.178.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.178.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.178.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.178.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.179.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.179.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.179.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.179.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.179.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.179.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.180.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.180.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.180.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.180.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.180.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.180.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.181.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.181.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.181.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.181.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.181.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.181.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.182.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.182.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.182.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.182.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.182.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.182.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.183.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.183.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.183.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.183.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.183.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.183.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.184.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.184.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.184.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.184.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.184.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.184.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.185.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.185.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.185.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.185.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.185.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.185.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.186.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.186.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.186.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.186.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.186.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.186.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.187.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.187.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.187.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.187.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.187.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.187.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.188.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.188.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.188.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.188.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.188.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.188.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.189.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.189.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.189.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.189.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.189.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.189.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.190.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.190.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.190.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.190.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.190.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.190.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.191.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.191.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.191.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.191.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.191.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.191.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.192.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.192.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.192.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.192.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.192.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.192.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.193.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.193.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.193.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.193.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.193.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.193.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.194.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.194.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.194.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.194.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.194.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.194.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.195.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.195.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.195.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.195.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.195.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.195.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.196.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.196.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.196.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.196.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.196.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.196.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.197.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.197.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.197.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.197.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.197.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.197.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.198.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.198.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.198.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.198.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.198.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.198.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.199.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.199.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.199.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.199.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.199.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.199.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.200.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.200.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.200.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.200.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.200.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.200.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.201.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.201.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.201.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.201.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.201.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.201.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.202.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.202.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.202.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.202.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.202.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.202.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.203.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.203.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.203.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.203.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.203.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.203.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.204.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.204.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.204.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.204.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.204.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.204.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.205.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.205.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.205.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.205.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.205.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.205.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.206.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.206.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.206.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.206.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.206.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.206.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.207.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.207.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.207.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.207.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.207.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.207.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.208.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.208.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.208.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.208.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.208.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.208.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.209.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.209.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.209.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.209.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.209.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.209.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.210.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.210.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.210.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.210.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.210.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.210.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.211.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.211.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.211.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.211.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.211.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.211.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.212.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.212.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.212.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.212.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.212.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.212.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.213.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.213.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.213.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.213.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.213.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.213.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.214.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.214.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.214.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.214.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.214.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.214.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.215.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.215.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.215.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.215.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.215.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.215.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.216.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.216.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.216.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.216.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.216.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.216.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.217.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.217.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.217.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.217.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.217.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.217.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.218.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.218.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.218.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.218.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.218.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.218.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.219.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.219.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.219.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.219.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.219.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.219.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.220.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.220.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.220.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.220.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.220.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.220.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.221.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.221.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.221.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.221.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.221.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.221.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.222.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.222.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.222.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.222.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.222.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.222.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.223.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.223.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.223.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.223.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.223.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.223.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.224.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.224.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.224.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.224.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.224.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.224.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.225.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.225.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.225.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.225.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.225.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.225.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.226.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.226.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.226.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.226.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.226.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.226.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.227.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.227.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.227.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.227.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.227.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.227.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.228.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.228.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.228.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.228.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.228.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.228.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.229.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.229.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.229.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.229.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.229.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.229.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.230.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.230.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.230.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.230.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.230.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.230.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.231.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.231.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.231.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.231.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.231.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.231.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.232.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.232.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.232.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.232.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.232.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.232.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.233.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.233.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.233.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.233.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.233.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.233.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.234.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.234.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.234.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.234.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.234.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.234.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.235.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.235.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.235.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.235.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.235.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.235.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.236.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.236.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.236.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.236.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.236.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.236.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.237.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.237.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.237.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.237.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.237.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.237.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.238.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.238.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.238.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.238.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.238.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.238.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.239.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.239.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.239.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.239.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.239.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.239.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.240.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.240.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.240.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.240.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.240.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.240.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.241.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.241.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.241.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.241.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.241.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.241.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.242.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.242.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.242.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.242.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.242.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.242.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.243.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.243.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.243.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.243.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.243.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.243.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.244.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.244.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.244.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.244.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.244.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.244.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.245.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.245.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.245.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.245.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.245.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.245.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.246.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.246.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.246.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.246.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.246.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.246.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.247.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.247.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.247.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.247.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.247.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.247.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.248.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.248.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.248.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.248.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.248.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.248.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.249.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.249.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.249.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.249.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.249.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.249.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.250.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.250.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.250.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.250.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.250.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.250.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.251.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.251.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.251.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.251.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.251.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.251.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.252.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.252.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.252.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.252.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.252.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.252.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.253.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.253.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.253.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.253.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.253.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.253.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.254.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.254.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.254.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.254.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.254.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.254.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.255.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.255.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.255.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.255.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.255.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.255.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.input_layernorm.weight": "model-00056-of-000163.safetensors", "model.layers.22.post_attention_layernorm.weight": "model-00056-of-000163.safetensors", "model.layers.23.self_attn.q_a_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.self_attn.q_a_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.self_attn.q_a_layernorm.weight": "model-00057-of-000163.safetensors", "model.layers.23.self_attn.q_b_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.self_attn.q_b_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.self_attn.kv_a_proj_with_mqa.weight": "model-00057-of-000163.safetensors", - "model.layers.23.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.self_attn.kv_a_layernorm.weight": "model-00057-of-000163.safetensors", "model.layers.23.self_attn.kv_b_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.self_attn.kv_b_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.self_attn.o_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.self_attn.o_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.gate.weight": "model-00057-of-000163.safetensors", "model.layers.23.mlp.gate.e_score_correction_bias": "model-00057-of-000163.safetensors", "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.shared_experts.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.shared_experts.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.0.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.0.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.0.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.0.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.0.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.1.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.1.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.1.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.1.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.1.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.2.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.2.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.2.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.2.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.2.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.3.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.3.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.3.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.3.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.3.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.4.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.4.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.4.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.4.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.4.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.5.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.5.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.5.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.5.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.5.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.6.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.6.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.6.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.6.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.6.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.7.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.7.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.7.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.7.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.7.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.8.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.8.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.8.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.8.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.8.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.9.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.9.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.9.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.9.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.9.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.10.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.10.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.10.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.10.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.10.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.11.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.11.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.11.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.11.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.11.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.12.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.12.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.12.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.12.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.12.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.13.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.13.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.13.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.13.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.13.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.14.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.14.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.14.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.14.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.14.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.15.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.15.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.15.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.15.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.15.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.16.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.16.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.16.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.16.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.16.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.17.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.17.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.17.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.17.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.17.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.18.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.18.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.18.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.18.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.18.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.19.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.19.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.19.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.19.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.19.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.20.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.20.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.20.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.20.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.20.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.21.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.21.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.21.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.21.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.21.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.22.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.22.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.22.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.22.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.22.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.23.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.23.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.23.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.23.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.23.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.24.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.24.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.24.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.24.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.24.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.25.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.25.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.25.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.25.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.25.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.26.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.26.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.26.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.26.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.26.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.27.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.27.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.27.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.27.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.27.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.28.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.28.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.28.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.28.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.28.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.29.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.29.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.29.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.29.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.29.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.30.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.30.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.30.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.30.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.30.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.31.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.31.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.31.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.31.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.31.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.32.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.32.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.32.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.32.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.32.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.33.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.33.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.33.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.33.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.33.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.34.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.34.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.34.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.34.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.34.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.35.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.35.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.35.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.35.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.35.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.36.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.36.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.36.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.36.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.36.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.37.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.37.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.37.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.37.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.37.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.38.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.38.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.38.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.38.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.38.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.39.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.39.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.39.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.39.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.39.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.40.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.40.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.40.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.40.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.40.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.41.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.41.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.41.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.41.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.41.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.42.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.42.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.42.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.42.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.42.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.43.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.43.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.43.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.43.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.43.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.44.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.44.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.44.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.44.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.44.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.45.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.45.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.45.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.45.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.45.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.46.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.46.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.46.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.46.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.46.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.47.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.47.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.47.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.47.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.47.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.48.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.48.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.48.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.48.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.48.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.49.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.49.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.49.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.49.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.49.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.50.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.50.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.50.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.50.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.50.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.51.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.51.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.51.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.51.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.51.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.52.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.52.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.52.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.52.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.52.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.53.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.53.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.53.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.53.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.53.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.54.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.54.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.54.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.54.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.54.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.55.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.55.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.55.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.55.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.55.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.56.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.56.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.56.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.56.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.56.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.57.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.57.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.57.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.57.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.57.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.58.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.58.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.58.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.58.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.58.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.59.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.59.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.59.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.59.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.59.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.60.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.60.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.60.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.60.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.60.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.61.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.61.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.61.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.61.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.61.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.62.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.62.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.62.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.62.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.62.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.63.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.63.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.63.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.63.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.63.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.64.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.64.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.64.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.64.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.64.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.65.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.65.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.65.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.65.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.65.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.66.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.66.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.66.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.66.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.66.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.67.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.67.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.67.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.67.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.67.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.68.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.68.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.68.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.68.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.68.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.69.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.69.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.69.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.69.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.69.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.70.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.70.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.70.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.70.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.70.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.71.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.71.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.71.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.71.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.71.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.72.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.72.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.72.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.72.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.72.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.73.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.73.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.73.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.73.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.73.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.74.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.74.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.74.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.74.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.74.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.75.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.75.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.75.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.75.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.75.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.76.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.76.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.76.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.76.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.76.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.77.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.77.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.77.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.77.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.77.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.78.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.78.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.78.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.78.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.78.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.79.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.79.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.79.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.79.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.79.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.80.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.80.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.80.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.80.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.80.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.81.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.81.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.81.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.81.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.81.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.82.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.82.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.82.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.82.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.82.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.83.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.83.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.83.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.83.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.83.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.84.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.84.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.84.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.84.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.84.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.85.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.85.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.85.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.85.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.85.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.86.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.86.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.86.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.86.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.86.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.87.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.87.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.87.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.87.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.87.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.88.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.88.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.88.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.88.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.88.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.89.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.89.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.89.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.89.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.89.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.90.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.90.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.90.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.90.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.90.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.91.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.91.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.91.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.91.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.91.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.92.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.92.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.92.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.92.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.92.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.93.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.93.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.93.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.93.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.93.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.94.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.94.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.94.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.94.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.94.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.95.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.95.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.95.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.95.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.95.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.96.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.96.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.96.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.96.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.96.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.97.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.97.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.97.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.97.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.97.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.98.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.98.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.98.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.98.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.98.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.99.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.99.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.99.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.99.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.99.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.100.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.100.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.100.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.100.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.100.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.101.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.101.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.101.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.101.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.101.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.102.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.102.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.102.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.102.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.102.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.103.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.103.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.103.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.103.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.103.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.104.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.104.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.104.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.104.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.104.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.105.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.105.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.105.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.105.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.105.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.106.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.106.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.106.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.106.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.106.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.107.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.107.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.107.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.107.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.107.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.108.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.108.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.108.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.108.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.108.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.109.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.109.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.109.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.109.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.109.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.110.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.110.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.110.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.110.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.110.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.111.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.111.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.111.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.111.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.111.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.112.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.112.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.112.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.112.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.112.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.113.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.113.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.113.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.113.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.113.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.114.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.114.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.114.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.114.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.114.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.114.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.115.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.115.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.115.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.115.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.115.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.116.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.116.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.116.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.116.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.116.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.117.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.117.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.117.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.117.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.117.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.118.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.118.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.118.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.118.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.118.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.119.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.119.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.119.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.119.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.119.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.120.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.120.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.120.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.120.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.120.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.121.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.121.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.121.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.121.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.121.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.122.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.122.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.122.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.122.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.122.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.123.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.123.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.123.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.123.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.123.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.124.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.124.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.124.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.124.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.124.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.125.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.125.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.125.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.125.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.125.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.126.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.126.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.126.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.126.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.126.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.127.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.127.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.127.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.127.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.127.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.128.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.128.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.128.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.128.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.128.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.128.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.129.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.129.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.129.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.129.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.129.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.129.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.130.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.130.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.130.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.130.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.130.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.130.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.131.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.131.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.131.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.131.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.131.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.131.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.132.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.132.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.132.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.132.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.132.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.132.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.133.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.133.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.133.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.133.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.133.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.133.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.134.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.134.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.134.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.134.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.134.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.134.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.135.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.135.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.135.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.135.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.135.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.135.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.136.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.136.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.136.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.136.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.136.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.136.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.137.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.137.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.137.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.137.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.137.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.137.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.138.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.138.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.138.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.138.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.138.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.138.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.139.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.139.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.139.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.139.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.139.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.139.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.140.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.140.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.140.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.140.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.140.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.140.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.141.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.141.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.141.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.141.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.141.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.141.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.142.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.142.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.142.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.142.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.142.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.142.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.143.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.143.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.143.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.143.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.143.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.143.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.144.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.144.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.144.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.144.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.144.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.144.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.145.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.145.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.145.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.145.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.145.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.145.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.146.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.146.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.146.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.146.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.146.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.146.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.147.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.147.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.147.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.147.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.147.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.147.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.148.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.148.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.148.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.148.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.148.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.148.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.149.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.149.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.149.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.149.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.149.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.149.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.150.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.150.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.150.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.150.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.150.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.150.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.151.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.151.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.151.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.151.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.151.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.151.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.152.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.152.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.152.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.152.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.152.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.152.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.153.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.153.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.153.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.153.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.153.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.153.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.154.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.154.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.154.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.154.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.154.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.154.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.155.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.155.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.155.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.155.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.155.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.155.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.156.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.156.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.156.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.156.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.156.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.156.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.157.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.157.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.157.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.157.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.157.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.157.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.158.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.158.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.158.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.158.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.158.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.158.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.159.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.159.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.159.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.159.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.159.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.159.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.160.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.160.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.160.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.160.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.160.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.160.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.161.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.161.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.161.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.161.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.161.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.161.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.162.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.162.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.162.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.162.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.162.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.162.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.163.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.163.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.163.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.163.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.163.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.163.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.164.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.164.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.164.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.164.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.164.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.164.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.165.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.165.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.165.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.165.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.165.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.165.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.166.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.166.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.166.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.166.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.166.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.166.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.167.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.167.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.167.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.167.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.167.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.167.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.168.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.168.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.168.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.168.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.168.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.168.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.169.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.169.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.169.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.169.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.169.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.169.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.170.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.170.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.170.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.170.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.170.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.170.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.171.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.171.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.171.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.171.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.171.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.171.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.172.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.172.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.172.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.172.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.172.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.172.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.173.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.173.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.173.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.173.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.173.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.173.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.174.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.174.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.174.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.174.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.174.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.174.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.175.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.175.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.175.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.175.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.175.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.175.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.176.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.176.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.176.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.176.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.176.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.176.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.177.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.177.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.177.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.177.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.177.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.177.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.178.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.178.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.178.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.178.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.178.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.178.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.179.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.179.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.179.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.179.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.179.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.179.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.180.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.180.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.180.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.180.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.180.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.180.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.181.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.181.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.181.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.181.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.181.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.181.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.182.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.182.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.182.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.182.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.182.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.182.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.183.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.183.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.183.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.183.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.183.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.183.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.184.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.184.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.184.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.184.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.184.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.184.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.185.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.185.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.185.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.185.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.185.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.185.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.186.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.186.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.186.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.186.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.186.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.186.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.187.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.187.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.187.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.187.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.187.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.187.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.188.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.188.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.188.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.188.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.188.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.188.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.189.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.189.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.189.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.189.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.189.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.189.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.190.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.190.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.190.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.190.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.190.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.190.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.191.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.191.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.191.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.191.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.191.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.191.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.192.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.192.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.192.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.192.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.192.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.192.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.193.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.193.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.193.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.193.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.193.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.193.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.194.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.194.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.194.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.194.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.194.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.194.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.195.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.195.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.195.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.195.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.195.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.195.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.196.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.196.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.196.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.196.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.196.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.196.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.197.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.197.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.197.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.197.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.197.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.197.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.198.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.198.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.198.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.198.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.198.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.198.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.199.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.199.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.199.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.199.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.199.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.199.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.200.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.200.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.200.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.200.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.200.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.200.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.201.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.201.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.201.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.201.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.201.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.201.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.202.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.202.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.202.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.202.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.202.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.202.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.203.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.203.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.203.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.203.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.203.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.203.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.204.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.204.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.204.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.204.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.204.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.204.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.205.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.205.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.205.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.205.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.205.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.205.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.206.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.206.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.206.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.206.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.206.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.206.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.207.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.207.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.207.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.207.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.207.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.207.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.208.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.208.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.208.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.208.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.208.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.208.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.209.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.209.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.209.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.209.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.209.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.209.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.210.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.210.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.210.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.210.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.210.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.210.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.211.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.211.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.211.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.211.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.211.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.211.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.212.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.212.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.212.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.212.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.212.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.212.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.213.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.213.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.213.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.213.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.213.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.213.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.214.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.214.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.214.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.214.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.214.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.214.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.215.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.215.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.215.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.215.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.215.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.215.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.216.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.216.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.216.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.216.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.216.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.216.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.217.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.217.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.217.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.217.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.217.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.217.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.218.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.218.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.218.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.218.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.218.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.218.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.219.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.219.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.219.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.219.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.219.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.219.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.220.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.220.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.220.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.220.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.220.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.220.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.221.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.221.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.221.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.221.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.221.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.221.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.222.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.222.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.222.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.222.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.222.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.222.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.223.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.223.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.223.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.223.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.223.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.223.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.224.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.224.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.224.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.224.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.224.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.224.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.225.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.225.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.225.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.225.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.225.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.225.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.226.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.226.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.226.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.226.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.226.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.226.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.227.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.227.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.227.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.227.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.227.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.227.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.228.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.228.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.228.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.228.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.228.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.228.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.229.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.229.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.229.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.229.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.229.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.229.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.230.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.230.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.230.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.230.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.230.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.230.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.231.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.231.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.231.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.231.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.231.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.231.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.232.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.232.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.232.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.232.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.232.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.232.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.233.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.233.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.233.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.233.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.233.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.233.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.234.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.234.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.234.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.234.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.234.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.234.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.235.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.235.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.235.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.235.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.235.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.235.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.236.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.236.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.236.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.236.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.236.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.236.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.237.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.237.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.237.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.237.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.237.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.237.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.238.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.238.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.238.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.238.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.238.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.238.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.239.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.239.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.239.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.239.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.239.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.239.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.240.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.240.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.240.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.240.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.240.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.240.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.241.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.241.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.241.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.241.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.241.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.241.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.242.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.242.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.242.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.242.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.242.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.242.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.243.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.243.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.243.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.243.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.243.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.243.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.244.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.244.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.244.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.244.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.244.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.244.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.245.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.245.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.245.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.245.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.245.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.245.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.246.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.246.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.246.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.246.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.246.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.246.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.247.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.247.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.247.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.247.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.247.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.247.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.248.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.248.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.248.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.248.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.248.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.248.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.249.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.249.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.249.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.249.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.249.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.249.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.250.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.250.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.250.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.250.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.250.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.250.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.251.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.251.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.251.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.251.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.251.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.251.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.252.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.252.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.252.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.252.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.252.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.252.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.253.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.253.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.253.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.253.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.253.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.253.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.254.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.254.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.254.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.254.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.254.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.254.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.255.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.255.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.255.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.255.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.255.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.255.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.input_layernorm.weight": "model-00059-of-000163.safetensors", "model.layers.23.post_attention_layernorm.weight": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.q_a_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.self_attn.q_a_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.q_a_layernorm.weight": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.q_b_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.self_attn.q_b_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.kv_a_proj_with_mqa.weight": "model-00059-of-000163.safetensors", - "model.layers.24.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.kv_a_layernorm.weight": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.kv_b_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.self_attn.kv_b_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.o_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.self_attn.o_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.gate.weight": "model-00059-of-000163.safetensors", "model.layers.24.mlp.gate.e_score_correction_bias": "model-00059-of-000163.safetensors", "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.shared_experts.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.shared_experts.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.shared_experts.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.0.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.0.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.0.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.0.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.0.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.1.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.1.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.1.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.1.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.1.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.2.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.2.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.2.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.2.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.2.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.3.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.3.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.3.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.3.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.3.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.4.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.4.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.4.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.4.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.4.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.5.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.5.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.5.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.5.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.5.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.6.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.6.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.6.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.6.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.6.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.7.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.7.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.7.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.7.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.7.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.8.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.8.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.8.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.8.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.8.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.9.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.9.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.9.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.9.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.9.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.10.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.10.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.10.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.10.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.10.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.11.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.11.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.11.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.11.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.11.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.12.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.12.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.12.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.12.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.12.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.13.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.13.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.13.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.13.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.13.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.14.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.14.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.14.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.14.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.14.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.15.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.15.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.15.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.15.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.15.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.16.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.16.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.16.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.16.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.16.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.17.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.17.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.17.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.17.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.17.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.18.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.18.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.18.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.18.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.18.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.19.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.19.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.19.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.19.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.19.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.20.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.20.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.20.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.20.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.20.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.21.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.21.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.21.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.21.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.21.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.22.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.22.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.22.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.22.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.22.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.23.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.23.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.23.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.23.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.23.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.24.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.24.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.24.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.24.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.24.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.25.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.25.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.25.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.25.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.25.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.26.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.26.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.26.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.26.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.26.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.27.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.27.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.27.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.27.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.27.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.28.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.28.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.28.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.28.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.28.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.29.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.29.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.29.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.29.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.29.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.30.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.30.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.30.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.30.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.30.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.31.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.31.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.31.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.31.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.31.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.32.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.32.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.32.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.32.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.32.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.33.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.33.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.33.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.33.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.33.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.34.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.34.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.34.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.34.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.34.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.35.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.35.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.35.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.35.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.35.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.36.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.36.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.36.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.36.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.36.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.37.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.37.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.37.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.37.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.37.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.38.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.38.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.38.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.38.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.38.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.39.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.39.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.39.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.39.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.39.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.40.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.40.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.40.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.40.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.40.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.41.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.41.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.41.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.41.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.41.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.42.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.42.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.42.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.42.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.42.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.43.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.43.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.43.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.43.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.43.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.44.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.44.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.44.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.44.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.44.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.45.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.45.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.45.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.45.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.45.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.46.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.46.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.46.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.46.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.46.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.47.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.47.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.47.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.47.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.47.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.47.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.48.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.48.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.48.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.48.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.48.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.49.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.49.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.49.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.49.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.49.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.50.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.50.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.50.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.50.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.50.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.51.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.51.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.51.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.51.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.51.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.52.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.52.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.52.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.52.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.52.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.53.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.53.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.53.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.53.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.53.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.54.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.54.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.54.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.54.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.54.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.55.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.55.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.55.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.55.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.55.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.56.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.56.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.56.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.56.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.56.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.57.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.57.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.57.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.57.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.57.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.58.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.58.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.58.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.58.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.58.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.59.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.59.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.59.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.59.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.59.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.60.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.60.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.60.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.60.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.60.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.61.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.61.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.61.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.61.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.61.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.62.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.62.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.62.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.62.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.62.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.63.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.63.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.63.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.63.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.63.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.64.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.64.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.64.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.64.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.64.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.65.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.65.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.65.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.65.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.65.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.66.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.66.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.66.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.66.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.66.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.67.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.67.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.67.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.67.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.67.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.68.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.68.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.68.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.68.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.68.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.69.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.69.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.69.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.69.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.69.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.70.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.70.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.70.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.70.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.70.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.71.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.71.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.71.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.71.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.71.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.72.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.72.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.72.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.72.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.72.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.73.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.73.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.73.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.73.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.73.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.74.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.74.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.74.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.74.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.74.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.75.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.75.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.75.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.75.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.75.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.76.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.76.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.76.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.76.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.76.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.77.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.77.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.77.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.77.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.77.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.78.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.78.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.78.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.78.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.78.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.79.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.79.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.79.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.79.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.79.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.80.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.80.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.80.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.80.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.80.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.81.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.81.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.81.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.81.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.81.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.82.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.82.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.82.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.82.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.82.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.83.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.83.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.83.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.83.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.83.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.84.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.84.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.84.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.84.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.84.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.85.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.85.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.85.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.85.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.85.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.86.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.86.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.86.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.86.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.86.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.87.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.87.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.87.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.87.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.87.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.88.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.88.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.88.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.88.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.88.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.89.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.89.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.89.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.89.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.89.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.90.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.90.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.90.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.90.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.90.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.91.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.91.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.91.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.91.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.91.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.92.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.92.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.92.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.92.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.92.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.93.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.93.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.93.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.93.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.93.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.94.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.94.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.94.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.94.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.94.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.95.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.95.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.95.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.95.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.95.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.96.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.96.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.96.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.96.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.96.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.97.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.97.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.97.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.97.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.97.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.98.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.98.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.98.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.98.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.98.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.99.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.99.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.99.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.99.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.99.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.100.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.100.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.100.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.100.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.100.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.101.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.101.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.101.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.101.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.101.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.102.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.102.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.102.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.102.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.102.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.103.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.103.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.103.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.103.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.103.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.104.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.104.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.104.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.104.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.104.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.105.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.105.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.105.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.105.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.105.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.106.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.106.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.106.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.106.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.106.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.107.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.107.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.107.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.107.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.107.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.108.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.108.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.108.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.108.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.108.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.109.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.109.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.109.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.109.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.109.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.110.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.110.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.110.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.110.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.110.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.111.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.111.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.111.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.111.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.111.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.112.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.112.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.112.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.112.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.112.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.113.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.113.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.113.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.113.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.113.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.114.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.114.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.114.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.114.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.114.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.115.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.115.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.115.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.115.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.115.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.116.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.116.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.116.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.116.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.116.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.117.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.117.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.117.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.117.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.117.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.118.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.118.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.118.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.118.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.118.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.119.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.119.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.119.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.119.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.119.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.120.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.120.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.120.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.120.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.120.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.121.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.121.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.121.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.121.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.121.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.122.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.122.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.122.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.122.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.122.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.123.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.123.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.123.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.123.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.123.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.124.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.124.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.124.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.124.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.124.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.125.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.125.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.125.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.125.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.125.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.126.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.126.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.126.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.126.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.126.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.127.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.127.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.127.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.127.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.127.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.128.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.128.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.128.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.128.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.128.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.128.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.129.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.129.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.129.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.129.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.129.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.129.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.130.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.130.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.130.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.130.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.130.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.130.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.131.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.131.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.131.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.131.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.131.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.131.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.132.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.132.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.132.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.132.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.132.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.132.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.133.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.133.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.133.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.133.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.133.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.133.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.134.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.134.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.134.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.134.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.134.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.134.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.135.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.135.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.135.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.135.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.135.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.135.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.136.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.136.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.136.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.136.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.136.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.136.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.137.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.137.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.137.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.137.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.137.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.137.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.138.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.138.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.138.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.138.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.138.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.138.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.139.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.139.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.139.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.139.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.139.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.139.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.140.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.140.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.140.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.140.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.140.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.140.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.141.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.141.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.141.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.141.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.141.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.141.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.142.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.142.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.142.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.142.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.142.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.142.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.143.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.143.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.143.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.143.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.143.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.143.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.144.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.144.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.144.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.144.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.144.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.144.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.145.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.145.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.145.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.145.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.145.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.145.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.146.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.146.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.146.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.146.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.146.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.146.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.147.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.147.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.147.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.147.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.147.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.147.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.148.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.148.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.148.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.148.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.148.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.148.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.149.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.149.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.149.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.149.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.149.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.149.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.150.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.150.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.150.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.150.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.150.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.150.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.151.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.151.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.151.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.151.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.151.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.151.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.152.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.152.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.152.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.152.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.152.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.152.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.153.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.153.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.153.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.153.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.153.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.153.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.154.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.154.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.154.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.154.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.154.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.154.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.155.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.155.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.155.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.155.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.155.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.155.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.156.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.156.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.156.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.156.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.156.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.156.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.157.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.157.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.157.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.157.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.157.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.157.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.158.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.158.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.158.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.158.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.158.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.158.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.159.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.159.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.159.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.159.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.159.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.159.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.160.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.160.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.160.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.160.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.160.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.160.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.161.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.161.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.161.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.161.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.161.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.161.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.162.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.162.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.162.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.162.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.162.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.162.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.163.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.163.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.163.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.163.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.163.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.163.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.164.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.164.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.164.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.164.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.164.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.164.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.165.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.165.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.165.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.165.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.165.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.165.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.166.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.166.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.166.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.166.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.166.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.166.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.167.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.167.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.167.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.167.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.167.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.167.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.168.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.168.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.168.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.168.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.168.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.168.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.169.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.169.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.169.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.169.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.169.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.169.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.170.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.170.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.170.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.170.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.170.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.170.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.171.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.171.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.171.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.171.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.171.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.171.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.172.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.172.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.172.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.172.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.172.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.172.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.173.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.173.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.173.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.173.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.173.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.173.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.174.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.174.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.174.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.174.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.174.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.174.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.175.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.175.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.175.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.175.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.175.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.175.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.176.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.176.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.176.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.176.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.176.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.176.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.177.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.177.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.177.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.177.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.177.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.177.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.178.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.178.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.178.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.178.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.178.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.178.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.179.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.179.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.179.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.179.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.179.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.179.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.180.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.180.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.180.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.180.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.180.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.180.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.181.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.181.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.181.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.181.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.181.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.181.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.182.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.182.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.182.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.182.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.182.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.182.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.183.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.183.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.183.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.183.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.183.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.183.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.184.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.184.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.184.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.184.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.184.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.184.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.185.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.185.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.185.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.185.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.185.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.185.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.186.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.186.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.186.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.186.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.186.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.186.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.187.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.187.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.187.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.187.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.187.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.187.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.188.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.188.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.188.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.188.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.188.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.188.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.189.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.189.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.189.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.189.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.189.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.189.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.190.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.190.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.190.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.190.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.190.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.190.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.191.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.191.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.191.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.191.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.191.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.191.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.192.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.192.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.192.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.192.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.192.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.192.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.193.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.193.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.193.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.193.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.193.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.193.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.194.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.194.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.194.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.194.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.194.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.194.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.195.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.195.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.195.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.195.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.195.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.195.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.196.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.196.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.196.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.196.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.196.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.196.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.197.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.197.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.197.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.197.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.197.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.197.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.198.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.198.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.198.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.198.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.198.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.198.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.199.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.199.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.199.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.199.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.199.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.199.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.200.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.200.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.200.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.200.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.200.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.200.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.201.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.201.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.201.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.201.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.201.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.201.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.202.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.202.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.202.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.202.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.202.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.202.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.203.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.203.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.203.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.203.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.203.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.203.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.204.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.204.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.204.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.204.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.204.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.204.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.205.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.205.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.205.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.205.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.205.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.205.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.206.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.206.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.206.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.206.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.206.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.206.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.207.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.207.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.207.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.207.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.207.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.207.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.208.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.208.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.208.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.208.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.208.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.208.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.209.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.209.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.209.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.209.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.209.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.209.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.210.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.210.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.210.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.210.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.210.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.210.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.211.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.211.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.211.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.211.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.211.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.211.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.212.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.212.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.212.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.212.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.212.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.212.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.213.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.213.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.213.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.213.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.213.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.213.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.214.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.214.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.214.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.214.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.214.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.214.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.215.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.215.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.215.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.215.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.215.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.215.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.216.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.216.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.216.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.216.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.216.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.216.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.217.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.217.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.217.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.217.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.217.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.217.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.218.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.218.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.218.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.218.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.218.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.218.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.219.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.219.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.219.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.219.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.219.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.219.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.220.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.220.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.220.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.220.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.220.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.220.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.221.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.221.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.221.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.221.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.221.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.221.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.222.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.222.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.222.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.222.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.222.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.222.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.223.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.223.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.223.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.223.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.223.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.223.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.224.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.224.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.224.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.224.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.224.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.224.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.225.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.225.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.225.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.225.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.225.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.225.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.226.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.226.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.226.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.226.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.226.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.226.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.227.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.227.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.227.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.227.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.227.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.227.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.228.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.228.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.228.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.228.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.228.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.228.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.229.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.229.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.229.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.229.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.229.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.229.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.230.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.230.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.230.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.230.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.230.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.230.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.231.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.231.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.231.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.231.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.231.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.231.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.232.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.232.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.232.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.232.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.232.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.232.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.233.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.233.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.233.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.233.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.233.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.233.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.234.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.234.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.234.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.234.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.234.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.234.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.235.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.235.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.235.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.235.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.235.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.235.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.236.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.236.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.236.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.236.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.236.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.236.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.237.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.237.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.237.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.237.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.237.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.237.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.238.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.238.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.238.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.238.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.238.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.238.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.239.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.239.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.239.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.239.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.239.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.239.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.240.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.240.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.240.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.240.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.240.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.240.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.241.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.241.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.241.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.241.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.241.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.241.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.242.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.242.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.242.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.242.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.242.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.242.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.243.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.243.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.243.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.243.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.243.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.243.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.244.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.244.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.244.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.244.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.244.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.244.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.245.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.245.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.245.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.245.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.245.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.245.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.246.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.246.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.246.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.246.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.246.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.246.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.247.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.247.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.247.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.247.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.247.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.247.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.248.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.248.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.248.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.248.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.248.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.248.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.249.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.249.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.249.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.249.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.249.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.249.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.250.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.250.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.250.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.250.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.250.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.250.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.251.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.251.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.251.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.251.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.251.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.251.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.252.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.252.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.252.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.252.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.252.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.252.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.253.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.253.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.253.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.253.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.253.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.253.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.254.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.254.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.254.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.254.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.254.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.254.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.255.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.255.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.255.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.255.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.255.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.255.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.input_layernorm.weight": "model-00062-of-000163.safetensors", "model.layers.24.post_attention_layernorm.weight": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.q_a_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.self_attn.q_a_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.q_a_layernorm.weight": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.q_b_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.self_attn.q_b_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.kv_a_proj_with_mqa.weight": "model-00062-of-000163.safetensors", - "model.layers.25.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.kv_a_layernorm.weight": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.kv_b_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.self_attn.kv_b_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.o_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.self_attn.o_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.gate.weight": "model-00062-of-000163.safetensors", "model.layers.25.mlp.gate.e_score_correction_bias": "model-00062-of-000163.safetensors", "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.shared_experts.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.shared_experts.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.shared_experts.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.0.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.0.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.0.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.0.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.0.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.1.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.1.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.1.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.1.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.1.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.2.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.2.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.2.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.2.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.2.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.3.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.3.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.3.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.3.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.3.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.4.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.4.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.4.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.4.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.4.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.5.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.5.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.5.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.5.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.5.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.6.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.6.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.6.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.6.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.6.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.7.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.7.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.7.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.7.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.7.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.8.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.8.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.8.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.8.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.8.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.9.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.9.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.9.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.9.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.9.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.10.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.10.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.10.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.10.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.10.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.11.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.11.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.11.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.11.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.11.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.12.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.12.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.12.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.12.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.12.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.13.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.13.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.13.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.13.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.13.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.14.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.14.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.14.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.14.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.14.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.15.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.15.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.15.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.15.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.15.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.16.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.16.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.16.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.16.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.16.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.17.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.17.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.17.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.17.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.17.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.18.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.18.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.18.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.18.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.18.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.19.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.19.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.19.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.19.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.19.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.20.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.20.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.20.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.20.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.20.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.21.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.21.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.21.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.21.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.21.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.22.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.22.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.22.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.22.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.22.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.23.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.23.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.23.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.23.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.23.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.24.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.24.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.24.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.24.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.24.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.25.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.25.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.25.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.25.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.25.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.26.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.26.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.26.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.26.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.26.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.27.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.27.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.27.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.27.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.27.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.28.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.28.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.28.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.28.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.28.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.29.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.29.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.29.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.29.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.29.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.30.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.30.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.30.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.30.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.30.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.31.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.31.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.31.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.31.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.31.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.32.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.32.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.32.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.32.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.32.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.33.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.33.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.33.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.33.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.33.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.34.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.34.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.34.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.34.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.34.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.35.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.35.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.35.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.35.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.35.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.36.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.36.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.36.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.36.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.36.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.37.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.37.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.37.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.37.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.37.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.38.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.38.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.38.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.38.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.38.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.39.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.39.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.39.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.39.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.39.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.40.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.40.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.40.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.40.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.40.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.41.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.41.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.41.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.41.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.41.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.42.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.42.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.42.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.42.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.42.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.43.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.43.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.43.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.43.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.43.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.44.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.44.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.44.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.44.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.44.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.45.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.45.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.45.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.45.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.45.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.46.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.46.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.46.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.46.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.46.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.47.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.47.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.47.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.47.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.47.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.48.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.48.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.48.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.48.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.48.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.49.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.49.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.49.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.49.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.49.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.50.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.50.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.50.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.50.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.50.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.51.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.51.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.51.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.51.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.51.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.52.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.52.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.52.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.52.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.52.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.53.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.53.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.53.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.53.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.53.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.54.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.54.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.54.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.54.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.54.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.55.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.55.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.55.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.55.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.55.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.56.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.56.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.56.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.56.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.56.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.57.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.57.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.57.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.57.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.57.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.58.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.58.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.58.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.58.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.58.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.59.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.59.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.59.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.59.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.59.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.60.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.60.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.60.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.60.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.60.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.61.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.61.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.61.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.61.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.61.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.62.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.62.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.62.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.62.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.62.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.63.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.63.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.63.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.63.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.63.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.64.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.64.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.64.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.64.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.64.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.65.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.65.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.65.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.65.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.65.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.66.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.66.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.66.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.66.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.66.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.67.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.67.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.67.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.67.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.67.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.68.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.68.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.68.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.68.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.68.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.69.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.69.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.69.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.69.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.69.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.70.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.70.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.70.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.70.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.70.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.71.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.71.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.71.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.71.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.71.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.72.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.72.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.72.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.72.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.72.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.73.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.73.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.73.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.73.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.73.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.74.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.74.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.74.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.74.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.74.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.75.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.75.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.75.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.75.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.75.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.76.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.76.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.76.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.76.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.76.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.77.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.77.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.77.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.77.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.77.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.78.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.78.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.78.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.78.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.78.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.79.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.79.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.79.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.79.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.79.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.80.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.80.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.80.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.80.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.80.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.81.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.81.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.81.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.81.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.81.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.82.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.82.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.82.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.82.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.82.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.83.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.83.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.83.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.83.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.83.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.84.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.84.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.84.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.84.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.84.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.85.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.85.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.85.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.85.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.85.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.86.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.86.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.86.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.86.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.86.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.87.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.87.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.87.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.87.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.87.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.88.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.88.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.88.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.88.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.88.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.89.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.89.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.89.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.89.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.89.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.90.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.90.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.90.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.90.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.90.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.91.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.91.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.91.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.91.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.91.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.92.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.92.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.92.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.92.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.92.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.93.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.93.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.93.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.93.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.93.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.94.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.94.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.94.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.94.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.94.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.95.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.95.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.95.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.95.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.95.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.96.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.96.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.96.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.96.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.96.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.97.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.97.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.97.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.97.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.97.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.98.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.98.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.98.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.98.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.98.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.99.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.99.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.99.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.99.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.99.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.100.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.100.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.100.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.100.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.100.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.101.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.101.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.101.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.101.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.101.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.102.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.102.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.102.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.102.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.102.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.103.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.103.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.103.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.103.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.103.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.104.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.104.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.104.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.104.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.104.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.105.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.105.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.105.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.105.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.105.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.106.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.106.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.106.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.106.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.106.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.107.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.107.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.107.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.107.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.107.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.108.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.108.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.108.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.108.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.108.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.109.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.109.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.109.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.109.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.109.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.110.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.110.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.110.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.110.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.110.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.111.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.111.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.111.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.111.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.111.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.112.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.112.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.112.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.112.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.112.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.113.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.113.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.113.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.113.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.113.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.114.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.114.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.114.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.114.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.114.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.115.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.115.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.115.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.115.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.115.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.116.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.116.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.116.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.116.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.116.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.117.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.117.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.117.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.117.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.117.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.118.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.118.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.118.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.118.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.118.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.119.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.119.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.119.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.119.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.119.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.120.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.120.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.120.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.120.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.120.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.121.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.121.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.121.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.121.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.121.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.122.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.122.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.122.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.122.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.122.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.123.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.123.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.123.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.123.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.123.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.124.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.124.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.124.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.124.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.124.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.125.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.125.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.125.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.125.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.125.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.126.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.126.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.126.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.126.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.126.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.127.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.127.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.127.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.127.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.127.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.128.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.128.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.128.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.128.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.128.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.128.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.129.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.129.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.129.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.129.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.129.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.129.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.130.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.130.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.130.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.130.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.130.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.130.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.131.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.131.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.131.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.131.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.131.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.131.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.132.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.132.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.132.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.132.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.132.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.132.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.133.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.133.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.133.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.133.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.133.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.133.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.134.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.134.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.134.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.134.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.134.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.134.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.135.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.135.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.135.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.135.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.135.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.135.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.136.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.136.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.136.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.136.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.136.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.136.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.137.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.137.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.137.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.137.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.137.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.137.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.138.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.138.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.138.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.138.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.138.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.138.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.139.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.139.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.139.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.139.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.139.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.139.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.140.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.140.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.140.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.140.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.140.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.140.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.141.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.141.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.141.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.141.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.141.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.141.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.142.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.142.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.142.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.142.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.142.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.142.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.143.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.143.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.143.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.143.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.143.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.143.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.144.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.144.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.144.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.144.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.144.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.144.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.145.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.145.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.145.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.145.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.145.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.145.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.146.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.146.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.146.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.146.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.146.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.146.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.147.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.147.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.147.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.147.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.147.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.147.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.148.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.148.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.148.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.148.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.148.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.148.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.149.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.149.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.149.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.149.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.149.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.149.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.150.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.150.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.150.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.150.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.150.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.150.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.151.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.151.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.151.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.151.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.151.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.151.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.152.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.152.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.152.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.152.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.152.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.152.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.153.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.153.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.153.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.153.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.153.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.153.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.154.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.154.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.154.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.154.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.154.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.154.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.155.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.155.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.155.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.155.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.155.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.155.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.156.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.156.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.156.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.156.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.156.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.156.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.157.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.157.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.157.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.157.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.157.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.157.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.158.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.158.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.158.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.158.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.158.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.158.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.159.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.159.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.159.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.159.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.159.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.159.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.160.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.160.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.160.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.160.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.160.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.160.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.161.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.161.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.161.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.161.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.161.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.161.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.162.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.162.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.162.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.162.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.162.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.162.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.163.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.163.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.163.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.163.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.163.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.163.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.164.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.164.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.164.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.164.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.164.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.164.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.165.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.165.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.165.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.165.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.165.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.165.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.166.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.166.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.166.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.166.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.166.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.166.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.167.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.167.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.167.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.167.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.167.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.167.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.168.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.168.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.168.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.168.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.168.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.168.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.169.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.169.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.169.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.169.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.169.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.169.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.170.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.170.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.170.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.170.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.170.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.170.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.171.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.171.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.171.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.171.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.171.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.171.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.172.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.172.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.172.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.172.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.172.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.172.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.173.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.173.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.173.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.173.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.173.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.173.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.174.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.174.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.174.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.174.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.174.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.174.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.175.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.175.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.175.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.175.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.175.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.175.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.176.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.176.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.176.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.176.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.176.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.176.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.177.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.177.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.177.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.177.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.177.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.177.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.178.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.178.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.178.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.178.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.178.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.178.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.179.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.179.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.179.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.179.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.179.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.179.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.180.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.180.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.180.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.180.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.180.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.180.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.181.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.181.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.181.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.181.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.181.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.181.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.182.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.182.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.182.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.182.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.182.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.182.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.183.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.183.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.183.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.183.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.183.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.183.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.184.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.184.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.184.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.184.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.184.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.184.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.185.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.185.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.185.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.185.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.185.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.185.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.186.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.186.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.186.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.186.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.186.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.186.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.187.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.187.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.187.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.187.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.187.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.187.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.188.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.188.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.188.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.188.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.188.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.188.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.189.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.189.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.189.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.189.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.189.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.189.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.190.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.190.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.190.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.190.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.190.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.190.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.191.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.191.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.191.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.191.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.191.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.191.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.192.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.192.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.192.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.192.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.192.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.192.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.193.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.193.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.193.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.193.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.193.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.193.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.194.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.194.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.194.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.194.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.194.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.194.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.195.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.195.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.195.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.195.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.195.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.195.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.196.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.196.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.196.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.196.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.196.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.196.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.197.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.197.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.197.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.197.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.197.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.197.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.198.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.198.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.198.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.198.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.198.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.198.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.199.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.199.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.199.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.199.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.199.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.199.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.200.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.200.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.200.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.200.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.200.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.200.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.201.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.201.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.201.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.201.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.201.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.201.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.202.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.202.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.202.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.202.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.202.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.202.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.203.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.203.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.203.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.203.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.203.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.203.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.204.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.204.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.204.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.204.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.204.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.204.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.205.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.205.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.205.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.205.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.205.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.205.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.206.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.206.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.206.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.206.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.206.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.206.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.207.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.207.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.207.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.207.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.207.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.207.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.208.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.208.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.208.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.208.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.208.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.208.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.209.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.209.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.209.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.209.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.209.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.209.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.210.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.210.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.210.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.210.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.210.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.210.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.211.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.211.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.211.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.211.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.211.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.211.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.212.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.212.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.212.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.212.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.212.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.212.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.213.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.213.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.213.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.213.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.213.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.213.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.214.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.214.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.214.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.214.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.214.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.214.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.215.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.215.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.215.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.215.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.215.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.215.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.216.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.216.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.216.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.216.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.216.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.216.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.217.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.217.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.217.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.217.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.217.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.217.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.218.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.218.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.218.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.218.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.218.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.218.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.219.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.219.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.219.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.219.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.219.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.219.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.220.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.220.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.220.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.220.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.220.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.220.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.221.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.221.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.221.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.221.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.221.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.221.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.222.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.222.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.222.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.222.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.222.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.222.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.223.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.223.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.223.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.223.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.223.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.223.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.224.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.224.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.224.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.224.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.224.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.224.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.225.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.225.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.225.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.225.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.225.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.225.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.226.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.226.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.226.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.226.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.226.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.226.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.227.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.227.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.227.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.227.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.227.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.227.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.228.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.228.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.228.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.228.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.228.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.228.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.229.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.229.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.229.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.229.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.229.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.229.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.230.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.230.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.230.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.230.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.230.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.230.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.231.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.231.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.231.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.231.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.231.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.231.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.232.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.232.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.232.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.232.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.232.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.232.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.233.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.233.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.233.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.233.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.233.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.233.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.234.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.234.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.234.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.234.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.234.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.234.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.235.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.235.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.235.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.235.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.235.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.235.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.236.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.236.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.236.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.236.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.236.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.236.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.237.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.237.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.237.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.237.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.237.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.237.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.238.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.238.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.238.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.238.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.238.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.238.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.239.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.239.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.239.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.239.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.239.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.239.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.240.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.240.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.240.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.240.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.240.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.240.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.241.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.241.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.241.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.241.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.241.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.241.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.242.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.242.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.242.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.242.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.242.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.242.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.243.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.243.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.243.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.243.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.243.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.243.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.244.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.244.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.244.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.244.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.244.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.244.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.245.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.245.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.245.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.245.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.245.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.245.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.246.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.246.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.246.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.246.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.246.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.246.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.247.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.247.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.247.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.247.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.247.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.247.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.248.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.248.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.248.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.248.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.248.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.248.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.249.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.249.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.249.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.249.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.249.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.249.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.250.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.250.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.250.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.250.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.250.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.250.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.251.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.251.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.251.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.251.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.251.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.251.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.252.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.252.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.252.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.252.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.252.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.252.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.253.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.253.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.253.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.253.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.253.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.253.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.254.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.254.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.254.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.254.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.254.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.254.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.255.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.255.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.255.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.255.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.255.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.255.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.input_layernorm.weight": "model-00065-of-000163.safetensors", "model.layers.25.post_attention_layernorm.weight": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.q_a_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.self_attn.q_a_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.q_a_layernorm.weight": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.q_b_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.self_attn.q_b_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.kv_a_proj_with_mqa.weight": "model-00065-of-000163.safetensors", - "model.layers.26.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.kv_a_layernorm.weight": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.kv_b_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.self_attn.kv_b_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.o_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.self_attn.o_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.gate.weight": "model-00065-of-000163.safetensors", "model.layers.26.mlp.gate.e_score_correction_bias": "model-00065-of-000163.safetensors", "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.shared_experts.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.shared_experts.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.shared_experts.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.0.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.0.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.0.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.0.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.0.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.0.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.1.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.1.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.1.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.1.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.1.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.2.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.2.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.2.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.2.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.2.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.3.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.3.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.3.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.3.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.3.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.4.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.4.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.4.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.4.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.4.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.5.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.5.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.5.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.5.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.5.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.6.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.6.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.6.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.6.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.6.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.7.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.7.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.7.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.7.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.7.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.8.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.8.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.8.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.8.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.8.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.9.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.9.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.9.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.9.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.9.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.10.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.10.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.10.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.10.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.10.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.11.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.11.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.11.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.11.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.11.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.12.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.12.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.12.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.12.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.12.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.13.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.13.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.13.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.13.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.13.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.14.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.14.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.14.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.14.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.14.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.15.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.15.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.15.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.15.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.15.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.16.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.16.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.16.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.16.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.16.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.17.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.17.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.17.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.17.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.17.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.18.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.18.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.18.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.18.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.18.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.19.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.19.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.19.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.19.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.19.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.20.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.20.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.20.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.20.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.20.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.21.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.21.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.21.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.21.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.21.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.22.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.22.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.22.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.22.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.22.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.23.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.23.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.23.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.23.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.23.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.24.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.24.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.24.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.24.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.24.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.25.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.25.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.25.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.25.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.25.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.26.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.26.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.26.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.26.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.26.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.27.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.27.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.27.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.27.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.27.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.28.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.28.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.28.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.28.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.28.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.29.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.29.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.29.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.29.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.29.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.30.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.30.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.30.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.30.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.30.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.31.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.31.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.31.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.31.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.31.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.32.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.32.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.32.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.32.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.32.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.33.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.33.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.33.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.33.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.33.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.34.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.34.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.34.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.34.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.34.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.35.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.35.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.35.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.35.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.35.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.36.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.36.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.36.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.36.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.36.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.37.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.37.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.37.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.37.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.37.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.38.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.38.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.38.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.38.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.38.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.39.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.39.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.39.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.39.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.39.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.40.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.40.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.40.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.40.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.40.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.41.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.41.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.41.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.41.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.41.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.42.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.42.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.42.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.42.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.42.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.43.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.43.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.43.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.43.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.43.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.44.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.44.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.44.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.44.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.44.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.45.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.45.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.45.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.45.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.45.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.45.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.46.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.46.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.46.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.46.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.46.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.47.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.47.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.47.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.47.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.47.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.48.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.48.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.48.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.48.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.48.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.49.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.49.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.49.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.49.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.49.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.50.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.50.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.50.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.50.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.50.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.51.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.51.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.51.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.51.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.51.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.52.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.52.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.52.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.52.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.52.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.53.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.53.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.53.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.53.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.53.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.54.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.54.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.54.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.54.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.54.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.55.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.55.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.55.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.55.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.55.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.56.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.56.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.56.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.56.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.56.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.57.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.57.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.57.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.57.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.57.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.58.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.58.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.58.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.58.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.58.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.59.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.59.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.59.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.59.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.59.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.60.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.60.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.60.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.60.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.60.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.61.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.61.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.61.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.61.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.61.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.62.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.62.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.62.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.62.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.62.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.63.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.63.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.63.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.63.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.63.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.64.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.64.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.64.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.64.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.64.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.65.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.65.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.65.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.65.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.65.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.66.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.66.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.66.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.66.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.66.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.66.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.67.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.67.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.67.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.67.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.67.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.68.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.68.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.68.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.68.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.68.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.69.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.69.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.69.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.69.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.69.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.70.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.70.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.70.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.70.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.70.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.71.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.71.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.71.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.71.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.71.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.72.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.72.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.72.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.72.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.72.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.73.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.73.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.73.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.73.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.73.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.74.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.74.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.74.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.74.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.74.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.75.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.75.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.75.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.75.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.75.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.76.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.76.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.76.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.76.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.76.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.77.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.77.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.77.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.77.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.77.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.78.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.78.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.78.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.78.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.78.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.79.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.79.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.79.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.79.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.79.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.80.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.80.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.80.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.80.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.80.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.81.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.81.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.81.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.81.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.81.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.82.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.82.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.82.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.82.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.82.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.83.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.83.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.83.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.83.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.83.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.84.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.84.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.84.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.84.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.84.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.85.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.85.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.85.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.85.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.85.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.86.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.86.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.86.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.86.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.86.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.87.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.87.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.87.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.87.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.87.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.88.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.88.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.88.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.88.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.88.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.89.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.89.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.89.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.89.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.89.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.90.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.90.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.90.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.90.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.90.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.91.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.91.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.91.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.91.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.91.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.92.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.92.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.92.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.92.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.92.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.93.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.93.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.93.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.93.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.93.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.94.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.94.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.94.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.94.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.94.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.94.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.95.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.95.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.95.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.95.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.95.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.96.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.96.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.96.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.96.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.96.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.97.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.97.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.97.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.97.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.97.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.98.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.98.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.98.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.98.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.98.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.99.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.99.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.99.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.99.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.99.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.100.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.100.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.100.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.100.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.100.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.101.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.101.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.101.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.101.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.101.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.101.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.102.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.102.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.102.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.102.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.102.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.103.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.103.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.103.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.103.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.103.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.104.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.104.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.104.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.104.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.104.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.105.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.105.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.105.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.105.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.105.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.106.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.106.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.106.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.106.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.106.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.107.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.107.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.107.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.107.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.107.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.108.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.108.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.108.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.108.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.108.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.109.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.109.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.109.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.109.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.109.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.110.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.110.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.110.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.110.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.110.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.111.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.111.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.111.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.111.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.111.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.112.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.112.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.112.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.112.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.112.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.113.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.113.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.113.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.113.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.113.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.114.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.114.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.114.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.114.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.114.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.115.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.115.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.115.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.115.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.115.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.115.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.116.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.116.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.116.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.116.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.116.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.117.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.117.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.117.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.117.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.117.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.118.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.118.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.118.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.118.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.118.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.119.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.119.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.119.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.119.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.119.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.120.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.120.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.120.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.120.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.120.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.121.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.121.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.121.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.121.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.121.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.122.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.122.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.122.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.122.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.122.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.123.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.123.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.123.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.123.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.123.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.124.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.124.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.124.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.124.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.124.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.125.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.125.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.125.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.125.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.125.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.126.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.126.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.126.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.126.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.126.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.127.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.127.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.127.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.127.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.127.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.128.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.128.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.128.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.128.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.128.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.128.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.129.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.129.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.129.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.129.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.129.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.129.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.130.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.130.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.130.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.130.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.130.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.130.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.131.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.131.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.131.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.131.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.131.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.131.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.132.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.132.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.132.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.132.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.132.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.132.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.133.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.133.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.133.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.133.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.133.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.133.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.134.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.134.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.134.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.134.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.134.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.134.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.135.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.135.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.135.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.135.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.135.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.135.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.136.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.136.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.136.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.136.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.136.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.136.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.137.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.137.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.137.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.137.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.137.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.137.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.138.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.138.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.138.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.138.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.138.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.138.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.139.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.139.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.139.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.139.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.139.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.139.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.140.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.140.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.140.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.140.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.140.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.140.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.141.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.141.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.141.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.141.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.141.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.141.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.142.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.142.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.142.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.142.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.142.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.142.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.143.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.143.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.143.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.143.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.143.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.143.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.144.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.144.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.144.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.144.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.144.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.144.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.145.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.145.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.145.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.145.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.145.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.145.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.146.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.146.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.146.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.146.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.146.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.146.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.147.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.147.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.147.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.147.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.147.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.147.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.148.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.148.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.148.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.148.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.148.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.148.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.149.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.149.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.149.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.149.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.149.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.149.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.150.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.150.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.150.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.150.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.150.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.150.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.151.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.151.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.151.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.151.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.151.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.151.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.152.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.152.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.152.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.152.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.152.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.152.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.153.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.153.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.153.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.153.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.153.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.153.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.154.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.154.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.154.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.154.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.154.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.154.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.155.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.155.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.155.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.155.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.155.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.155.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.156.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.156.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.156.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.156.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.156.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.156.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.157.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.157.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.157.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.157.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.157.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.157.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.158.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.158.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.158.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.158.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.158.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.158.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.159.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.159.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.159.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.159.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.159.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.159.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.160.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.160.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.160.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.160.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.160.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.160.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.161.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.161.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.161.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.161.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.161.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.161.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.162.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.162.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.162.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.162.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.162.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.162.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.163.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.163.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.163.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.163.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.163.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.163.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.164.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.164.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.164.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.164.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.164.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.164.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.165.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.165.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.165.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.165.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.165.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.165.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.166.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.166.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.166.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.166.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.166.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.166.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.167.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.167.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.167.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.167.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.167.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.167.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.168.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.168.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.168.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.168.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.168.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.168.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.169.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.169.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.169.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.169.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.169.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.169.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.170.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.170.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.170.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.170.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.170.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.170.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.171.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.171.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.171.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.171.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.171.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.171.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.172.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.172.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.172.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.172.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.172.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.172.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.173.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.173.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.173.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.173.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.173.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.173.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.174.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.174.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.174.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.174.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.174.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.174.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.175.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.175.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.175.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.175.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.175.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.175.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.176.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.176.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.176.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.176.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.176.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.176.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.177.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.177.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.177.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.177.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.177.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.177.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.178.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.178.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.178.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.178.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.178.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.178.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.179.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.179.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.179.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.179.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.179.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.179.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.180.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.180.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.180.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.180.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.180.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.180.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.181.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.181.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.181.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.181.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.181.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.181.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.182.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.182.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.182.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.182.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.182.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.182.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.183.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.183.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.183.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.183.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.183.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.183.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.184.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.184.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.184.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.184.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.184.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.184.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.185.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.185.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.185.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.185.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.185.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.185.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.186.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.186.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.186.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.186.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.186.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.186.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.187.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.187.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.187.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.187.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.187.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.187.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.188.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.188.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.188.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.188.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.188.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.188.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.189.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.189.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.189.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.189.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.189.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.189.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.190.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.190.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.190.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.190.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.190.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.190.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.191.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.191.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.191.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.191.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.191.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.191.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.192.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.192.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.192.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.192.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.192.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.192.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.193.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.193.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.193.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.193.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.193.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.193.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.194.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.194.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.194.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.194.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.194.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.194.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.195.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.195.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.195.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.195.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.195.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.195.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.196.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.196.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.196.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.196.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.196.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.196.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.197.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.197.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.197.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.197.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.197.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.197.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.198.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.198.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.198.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.198.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.198.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.198.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.199.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.199.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.199.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.199.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.199.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.199.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.200.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.200.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.200.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.200.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.200.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.200.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.201.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.201.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.201.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.201.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.201.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.201.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.202.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.202.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.202.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.202.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.202.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.202.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.203.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.203.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.203.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.203.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.203.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.203.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.204.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.204.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.204.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.204.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.204.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.204.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.205.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.205.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.205.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.205.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.205.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.205.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.206.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.206.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.206.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.206.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.206.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.206.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.207.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.207.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.207.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.207.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.207.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.207.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.208.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.208.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.208.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.208.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.208.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.208.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.209.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.209.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.209.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.209.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.209.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.209.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.210.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.210.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.210.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.210.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.210.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.210.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.211.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.211.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.211.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.211.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.211.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.211.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.212.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.212.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.212.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.212.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.212.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.212.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.213.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.213.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.213.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.213.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.213.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.213.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.214.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.214.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.214.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.214.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.214.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.214.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.215.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.215.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.215.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.215.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.215.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.215.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.216.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.216.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.216.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.216.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.216.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.216.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.217.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.217.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.217.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.217.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.217.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.217.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.218.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.218.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.218.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.218.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.218.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.218.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.219.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.219.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.219.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.219.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.219.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.219.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.220.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.220.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.220.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.220.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.220.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.220.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.221.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.221.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.221.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.221.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.221.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.221.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.222.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.222.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.222.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.222.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.222.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.222.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.223.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.223.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.223.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.223.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.223.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.223.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.224.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.224.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.224.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.224.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.224.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.224.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.225.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.225.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.225.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.225.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.225.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.225.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.226.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.226.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.226.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.226.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.226.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.226.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.227.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.227.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.227.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.227.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.227.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.227.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.228.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.228.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.228.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.228.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.228.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.228.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.229.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.229.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.229.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.229.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.229.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.229.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.230.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.230.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.230.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.230.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.230.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.230.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.231.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.231.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.231.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.231.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.231.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.231.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.232.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.232.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.232.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.232.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.232.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.232.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.233.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.233.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.233.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.233.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.233.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.233.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.234.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.234.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.234.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.234.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.234.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.234.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.235.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.235.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.235.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.235.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.235.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.235.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.236.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.236.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.236.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.236.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.236.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.236.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.237.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.237.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.237.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.237.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.237.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.237.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.238.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.238.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.238.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.238.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.238.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.238.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.239.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.239.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.239.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.239.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.239.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.239.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.240.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.240.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.240.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.240.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.240.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.240.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.241.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.241.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.241.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.241.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.241.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.241.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.242.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.242.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.242.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.242.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.242.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.242.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.243.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.243.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.243.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.243.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.243.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.243.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.244.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.244.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.244.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.244.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.244.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.244.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.245.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.245.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.245.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.245.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.245.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.245.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.246.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.246.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.246.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.246.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.246.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.246.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.247.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.247.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.247.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.247.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.247.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.247.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.248.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.248.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.248.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.248.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.248.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.248.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.249.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.249.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.249.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.249.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.249.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.249.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.250.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.250.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.250.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.250.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.250.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.250.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.251.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.251.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.251.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.251.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.251.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.251.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.252.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.252.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.252.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.252.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.252.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.252.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.253.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.253.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.253.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.253.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.253.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.253.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.254.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.254.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.254.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.254.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.254.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.254.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.255.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.255.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.255.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.255.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.255.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.255.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.input_layernorm.weight": "model-00067-of-000163.safetensors", "model.layers.26.post_attention_layernorm.weight": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.q_a_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.self_attn.q_a_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.q_a_layernorm.weight": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.q_b_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.self_attn.q_b_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.kv_a_proj_with_mqa.weight": "model-00067-of-000163.safetensors", - "model.layers.27.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.kv_a_layernorm.weight": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.kv_b_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.self_attn.kv_b_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.o_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.self_attn.o_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.gate.weight": "model-00067-of-000163.safetensors", "model.layers.27.mlp.gate.e_score_correction_bias": "model-00067-of-000163.safetensors", "model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.shared_experts.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.shared_experts.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.0.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.0.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.0.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.0.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.0.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.1.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.1.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.1.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.1.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.1.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.2.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.2.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.2.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.2.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.2.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.3.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.3.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.3.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.3.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.3.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.4.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.4.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.4.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.4.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.4.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.5.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.5.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.5.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.5.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.5.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.6.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.6.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.6.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.6.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.6.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.7.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.7.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.7.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.7.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.7.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.8.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.8.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.8.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.8.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.8.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.9.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.9.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.9.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.9.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.9.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.10.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.10.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.10.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.10.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.10.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.11.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.11.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.11.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.11.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.11.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.12.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.12.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.12.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.12.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.12.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.13.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.13.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.13.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.13.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.13.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.14.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.14.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.14.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.14.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.14.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.15.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.15.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.15.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.15.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.15.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.16.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.16.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.16.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.16.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.16.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.17.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.17.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.17.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.17.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.17.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.18.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.18.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.18.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.18.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.18.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.19.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.19.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.19.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.19.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.19.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.20.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.20.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.20.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.20.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.20.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.21.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.21.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.21.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.21.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.21.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.22.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.22.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.22.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.22.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.22.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.23.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.23.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.23.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.23.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.23.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.24.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.24.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.24.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.24.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.24.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.25.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.25.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.25.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.25.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.25.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.26.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.26.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.26.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.26.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.26.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.27.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.27.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.27.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.27.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.27.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.28.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.28.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.28.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.28.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.28.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.29.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.29.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.29.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.29.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.29.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.30.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.30.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.30.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.30.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.30.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.31.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.31.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.31.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.31.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.31.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.32.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.32.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.32.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.32.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.32.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.33.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.33.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.33.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.33.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.33.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.34.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.34.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.34.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.34.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.34.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.35.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.35.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.35.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.35.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.35.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.36.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.36.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.36.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.36.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.36.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.37.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.37.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.37.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.37.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.37.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.38.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.38.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.38.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.38.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.38.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.39.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.39.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.39.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.39.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.39.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.40.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.40.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.40.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.40.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.40.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.41.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.41.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.41.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.41.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.41.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.42.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.42.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.42.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.42.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.42.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.43.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.43.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.43.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.43.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.43.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.44.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.44.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.44.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.44.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.44.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.45.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.45.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.45.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.45.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.45.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.46.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.46.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.46.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.46.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.46.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.47.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.47.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.47.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.47.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.47.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.48.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.48.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.48.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.48.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.48.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.49.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.49.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.49.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.49.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.49.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.50.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.50.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.50.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.50.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.50.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.51.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.51.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.51.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.51.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.51.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.52.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.52.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.52.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.52.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.52.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.53.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.53.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.53.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.53.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.53.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.54.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.54.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.54.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.54.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.54.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.55.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.55.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.55.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.55.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.55.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.56.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.56.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.56.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.56.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.56.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.57.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.57.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.57.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.57.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.57.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.58.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.58.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.58.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.58.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.58.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.59.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.59.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.59.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.59.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.59.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.60.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.60.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.60.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.60.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.60.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.61.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.61.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.61.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.61.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.61.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.62.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.62.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.62.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.62.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.62.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.63.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.63.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.63.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.63.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.63.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.64.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.64.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.64.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.64.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.64.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.65.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.65.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.65.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.65.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.65.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.66.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.66.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.66.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.66.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.66.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.67.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.67.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.67.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.67.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.67.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.68.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.68.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.68.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.68.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.68.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.69.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.69.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.69.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.69.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.69.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.70.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.70.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.70.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.70.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.70.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.71.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.71.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.71.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.71.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.71.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.72.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.72.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.72.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.72.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.72.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.73.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.73.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.73.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.73.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.73.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.74.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.74.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.74.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.74.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.74.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.75.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.75.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.75.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.75.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.75.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.76.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.76.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.76.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.76.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.76.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.77.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.77.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.77.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.77.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.77.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.78.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.78.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.78.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.78.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.78.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.79.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.79.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.79.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.79.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.79.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.80.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.80.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.80.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.80.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.80.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.81.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.81.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.81.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.81.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.81.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.82.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.82.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.82.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.82.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.82.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.83.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.83.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.83.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.83.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.83.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.84.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.84.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.84.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.84.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.84.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.85.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.85.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.85.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.85.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.85.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.86.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.86.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.86.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.86.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.86.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.87.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.87.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.87.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.87.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.87.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.88.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.88.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.88.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.88.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.88.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.89.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.89.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.89.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.89.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.89.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.90.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.90.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.90.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.90.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.90.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.91.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.91.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.91.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.91.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.91.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.92.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.92.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.92.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.92.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.92.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.93.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.93.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.93.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.93.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.93.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.94.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.94.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.94.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.94.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.94.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.95.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.95.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.95.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.95.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.95.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.96.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.96.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.96.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.96.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.96.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.97.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.97.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.97.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.97.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.97.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.98.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.98.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.98.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.98.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.98.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.99.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.99.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.99.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.99.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.99.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.100.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.100.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.100.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.100.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.100.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.101.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.101.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.101.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.101.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.101.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.102.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.102.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.102.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.102.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.102.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.103.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.103.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.103.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.103.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.103.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.104.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.104.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.104.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.104.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.104.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.105.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.105.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.105.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.105.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.105.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.106.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.106.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.106.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.106.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.106.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.107.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.107.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.107.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.107.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.107.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.108.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.108.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.108.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.108.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.108.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.109.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.109.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.109.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.109.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.109.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.110.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.110.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.110.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.110.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.110.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.111.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.111.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.111.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.111.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.111.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.112.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.112.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.112.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.112.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.112.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.113.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.113.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.113.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.113.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.113.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.114.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.114.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.114.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.114.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.114.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.115.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.115.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.115.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.115.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.115.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.116.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.116.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.116.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.116.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.116.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.117.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.117.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.117.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.117.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.117.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.118.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.118.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.118.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.118.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.118.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.119.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.119.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.119.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.119.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.119.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.120.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.120.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.120.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.120.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.120.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.121.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.121.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.121.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.121.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.121.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.122.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.122.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.122.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.122.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.122.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.123.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.123.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.123.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.123.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.123.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.124.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.124.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.124.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.124.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.124.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.125.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.125.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.125.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.125.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.125.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.126.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.126.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.126.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.126.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.126.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.127.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.127.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.127.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.127.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.127.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.128.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.128.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.128.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.128.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.128.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.128.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.129.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.129.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.129.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.129.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.129.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.129.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.130.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.130.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.130.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.130.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.130.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.130.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.131.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.131.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.131.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.131.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.131.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.131.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.132.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.132.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.132.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.132.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.132.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.132.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.133.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.133.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.133.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.133.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.133.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.133.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.134.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.134.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.134.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.134.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.134.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.134.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.135.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.135.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.135.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.135.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.135.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.135.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.136.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.136.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.136.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.136.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.136.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.136.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.137.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.137.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.137.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.137.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.137.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.137.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.138.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.138.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.138.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.138.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.138.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.138.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.139.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.139.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.139.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.139.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.139.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.139.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.140.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.140.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.140.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.140.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.140.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.140.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.141.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.141.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.141.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.141.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.141.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.141.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.142.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.142.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.142.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.142.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.142.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.142.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.143.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.143.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.143.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.143.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.143.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.143.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.144.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.144.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.144.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.144.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.144.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.144.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.145.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.145.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.145.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.145.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.145.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.145.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.146.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.146.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.146.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.146.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.146.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.146.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.147.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.147.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.147.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.147.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.147.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.147.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.148.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.148.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.148.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.148.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.148.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.148.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.149.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.149.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.149.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.149.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.149.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.149.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.150.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.150.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.150.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.150.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.150.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.150.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.151.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.151.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.151.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.151.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.151.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.151.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.152.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.152.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.152.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.152.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.152.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.152.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.153.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.153.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.153.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.153.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.153.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.153.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.154.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.154.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.154.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.154.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.154.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.154.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.155.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.155.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.155.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.155.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.155.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.155.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.156.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.156.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.156.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.156.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.156.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.156.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.157.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.157.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.157.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.157.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.157.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.157.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.158.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.158.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.158.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.158.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.158.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.158.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.159.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.159.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.159.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.159.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.159.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.159.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.160.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.160.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.160.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.160.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.160.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.160.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.161.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.161.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.161.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.161.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.161.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.161.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.162.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.162.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.162.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.162.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.162.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.162.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.163.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.163.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.163.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.163.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.163.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.163.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.164.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.164.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.164.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.164.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.164.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.164.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.165.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.165.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.165.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.165.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.165.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.165.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.166.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.166.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.166.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.166.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.166.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.166.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.167.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.167.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.167.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.167.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.167.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.167.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.168.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.168.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.168.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.168.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.168.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.168.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.169.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.169.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.169.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.169.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.169.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.169.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.170.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.170.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.170.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.170.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.170.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.170.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.171.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.171.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.171.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.171.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.171.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.171.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.172.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.172.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.172.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.172.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.172.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.172.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.173.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.173.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.173.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.173.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.173.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.173.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.174.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.174.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.174.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.174.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.174.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.174.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.175.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.175.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.175.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.175.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.175.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.175.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.176.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.176.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.176.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.176.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.176.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.176.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.177.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.177.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.177.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.177.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.177.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.177.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.178.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.178.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.178.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.178.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.178.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.178.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.179.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.179.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.179.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.179.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.179.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.179.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.180.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.180.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.180.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.180.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.180.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.180.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.181.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.181.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.181.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.181.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.181.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.181.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.182.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.182.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.182.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.182.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.182.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.182.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.183.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.183.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.183.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.183.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.183.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.183.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.184.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.184.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.184.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.184.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.184.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.184.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.185.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.185.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.185.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.185.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.185.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.185.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.186.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.186.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.186.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.186.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.186.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.186.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.187.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.187.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.187.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.187.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.187.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.187.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.188.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.188.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.188.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.188.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.188.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.188.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.189.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.189.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.189.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.189.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.189.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.189.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.190.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.190.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.190.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.190.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.190.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.190.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.191.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.191.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.191.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.191.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.191.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.191.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.192.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.192.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.192.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.192.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.192.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.192.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.193.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.193.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.193.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.193.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.193.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.193.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.194.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.194.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.194.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.194.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.194.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.194.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.195.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.195.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.195.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.195.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.195.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.195.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.196.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.196.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.196.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.196.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.196.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.196.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.197.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.197.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.197.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.197.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.197.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.197.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.198.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.198.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.198.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.198.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.198.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.198.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.199.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.199.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.199.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.199.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.199.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.199.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.200.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.200.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.200.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.200.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.200.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.200.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.201.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.201.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.201.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.201.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.201.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.201.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.202.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.202.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.202.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.202.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.202.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.202.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.203.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.203.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.203.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.203.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.203.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.203.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.204.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.204.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.204.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.204.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.204.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.204.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.205.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.205.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.205.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.205.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.205.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.205.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.206.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.206.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.206.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.206.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.206.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.206.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.207.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.207.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.207.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.207.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.207.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.207.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.208.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.208.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.208.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.208.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.208.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.208.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.209.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.209.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.209.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.209.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.209.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.209.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.210.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.210.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.210.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.210.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.210.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.210.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.211.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.211.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.211.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.211.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.211.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.211.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.212.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.212.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.212.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.212.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.212.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.212.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.213.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.213.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.213.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.213.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.213.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.213.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.214.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.214.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.214.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.214.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.214.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.214.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.215.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.215.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.215.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.215.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.215.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.215.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.216.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.216.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.216.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.216.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.216.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.216.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.217.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.217.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.217.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.217.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.217.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.217.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.218.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.218.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.218.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.218.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.218.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.218.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.219.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.219.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.219.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.219.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.219.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.219.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.220.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.220.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.220.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.220.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.220.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.220.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.221.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.221.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.221.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.221.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.221.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.221.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.222.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.222.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.222.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.222.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.222.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.222.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.223.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.223.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.223.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.223.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.223.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.223.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.224.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.224.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.224.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.224.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.224.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.224.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.225.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.225.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.225.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.225.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.225.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.225.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.226.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.226.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.226.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.226.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.226.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.226.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.227.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.227.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.227.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.227.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.227.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.227.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.228.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.228.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.228.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.228.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.228.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.228.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.229.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.229.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.229.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.229.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.229.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.229.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.230.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.230.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.230.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.230.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.230.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.230.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.231.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.231.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.231.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.231.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.231.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.231.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.232.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.232.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.232.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.232.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.232.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.232.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.233.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.233.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.233.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.233.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.233.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.233.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.234.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.234.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.234.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.234.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.234.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.234.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.235.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.235.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.235.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.235.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.235.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.235.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.236.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.236.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.236.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.236.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.236.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.236.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.237.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.237.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.237.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.237.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.237.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.237.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.238.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.238.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.238.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.238.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.238.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.238.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.239.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.239.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.239.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.239.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.239.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.239.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.240.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.240.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.240.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.240.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.240.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.240.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.241.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.241.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.241.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.241.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.241.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.241.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.242.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.242.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.242.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.242.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.242.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.242.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.243.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.243.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.243.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.243.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.243.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.243.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.244.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.244.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.244.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.244.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.244.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.244.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.245.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.245.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.245.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.245.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.245.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.245.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.246.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.246.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.246.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.246.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.246.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.246.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.247.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.247.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.247.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.247.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.247.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.247.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.248.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.248.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.248.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.248.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.248.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.248.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.249.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.249.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.249.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.249.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.249.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.249.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.250.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.250.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.250.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.250.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.250.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.250.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.251.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.251.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.251.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.251.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.251.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.251.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.252.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.252.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.252.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.252.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.252.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.252.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.253.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.253.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.253.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.253.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.253.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.253.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.254.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.254.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.254.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.254.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.254.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.254.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.255.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.255.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.255.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.255.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.255.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.255.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.input_layernorm.weight": "model-00070-of-000163.safetensors", "model.layers.27.post_attention_layernorm.weight": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.q_a_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.self_attn.q_a_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.q_a_layernorm.weight": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.q_b_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.self_attn.q_b_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.kv_a_proj_with_mqa.weight": "model-00070-of-000163.safetensors", - "model.layers.28.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.kv_a_layernorm.weight": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.kv_b_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.self_attn.kv_b_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.o_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.self_attn.o_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.gate.weight": "model-00070-of-000163.safetensors", "model.layers.28.mlp.gate.e_score_correction_bias": "model-00070-of-000163.safetensors", "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.shared_experts.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.shared_experts.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.0.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.0.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.0.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.0.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.0.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.1.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.1.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.1.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.1.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.1.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.2.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.2.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.2.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.2.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.2.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.3.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.3.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.3.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.3.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.3.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.4.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.4.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.4.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.4.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.4.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.5.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.5.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.5.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.5.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.5.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.6.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.6.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.6.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.6.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.6.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.7.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.7.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.7.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.7.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.7.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.8.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.8.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.8.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.8.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.8.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.9.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.9.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.9.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.9.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.9.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.10.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.10.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.10.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.10.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.10.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.11.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.11.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.11.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.11.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.11.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.12.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.12.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.12.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.12.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.12.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.13.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.13.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.13.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.13.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.13.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.14.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.14.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.14.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.14.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.14.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.15.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.15.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.15.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.15.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.15.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.16.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.16.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.16.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.16.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.16.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.17.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.17.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.17.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.17.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.17.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.18.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.18.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.18.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.18.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.18.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.19.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.19.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.19.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.19.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.19.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.20.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.20.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.20.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.20.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.20.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.21.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.21.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.21.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.21.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.21.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.22.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.22.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.22.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.22.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.22.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.23.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.23.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.23.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.23.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.23.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.24.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.24.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.24.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.24.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.24.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.25.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.25.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.25.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.25.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.25.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.26.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.26.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.26.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.26.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.26.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.27.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.27.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.27.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.27.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.27.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.28.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.28.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.28.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.28.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.28.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.29.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.29.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.29.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.29.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.29.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.30.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.30.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.30.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.30.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.30.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.31.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.31.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.31.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.31.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.31.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.32.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.32.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.32.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.32.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.32.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.33.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.33.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.33.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.33.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.33.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.34.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.34.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.34.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.34.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.34.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.35.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.35.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.35.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.35.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.35.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.36.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.36.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.36.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.36.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.36.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.37.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.37.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.37.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.37.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.37.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.38.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.38.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.38.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.38.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.38.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.39.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.39.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.39.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.39.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.39.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.40.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.40.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.40.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.40.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.40.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.41.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.41.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.41.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.41.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.41.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.42.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.42.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.42.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.42.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.42.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.43.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.43.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.43.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.43.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.43.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.44.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.44.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.44.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.44.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.44.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.45.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.45.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.45.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.45.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.45.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.46.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.46.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.46.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.46.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.46.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.47.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.47.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.47.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.47.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.47.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.48.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.48.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.48.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.48.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.48.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.49.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.49.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.49.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.49.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.49.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.50.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.50.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.50.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.50.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.50.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.51.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.51.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.51.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.51.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.51.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.52.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.52.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.52.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.52.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.52.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.53.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.53.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.53.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.53.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.53.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.54.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.54.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.54.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.54.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.54.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.55.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.55.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.55.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.55.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.55.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.56.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.56.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.56.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.56.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.56.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.57.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.57.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.57.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.57.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.57.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.58.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.58.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.58.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.58.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.58.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.59.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.59.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.59.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.59.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.59.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.60.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.60.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.60.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.60.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.60.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.61.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.61.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.61.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.61.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.61.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.62.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.62.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.62.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.62.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.62.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.63.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.63.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.63.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.63.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.63.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.64.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.64.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.64.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.64.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.64.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.65.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.65.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.65.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.65.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.65.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.66.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.66.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.66.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.66.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.66.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.67.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.67.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.67.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.67.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.67.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.68.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.68.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.68.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.68.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.68.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.69.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.69.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.69.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.69.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.69.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.70.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.70.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.70.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.70.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.70.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.71.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.71.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.71.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.71.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.71.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.72.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.72.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.72.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.72.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.72.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.73.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.73.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.73.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.73.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.73.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.74.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.74.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.74.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.74.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.74.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.75.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.75.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.75.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.75.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.75.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.76.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.76.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.76.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.76.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.76.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.77.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.77.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.77.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.77.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.77.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.78.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.78.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.78.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.78.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.78.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.79.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.79.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.79.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.79.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.79.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.80.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.80.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.80.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.80.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.80.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.81.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.81.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.81.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.81.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.81.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.82.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.82.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.82.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.82.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.82.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.83.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.83.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.83.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.83.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.83.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.84.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.84.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.84.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.84.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.84.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.85.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.85.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.85.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.85.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.85.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.86.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.86.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.86.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.86.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.86.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.87.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.87.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.87.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.87.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.87.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.88.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.88.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.88.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.88.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.88.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.89.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.89.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.89.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.89.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.89.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.90.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.90.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.90.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.90.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.90.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.91.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.91.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.91.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.91.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.91.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.92.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.92.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.92.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.92.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.92.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.93.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.93.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.93.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.93.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.93.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.94.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.94.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.94.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.94.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.94.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.94.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.95.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.95.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.95.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.95.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.95.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.96.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.96.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.96.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.96.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.96.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.97.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.97.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.97.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.97.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.97.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.98.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.98.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.98.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.98.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.98.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.99.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.99.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.99.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.99.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.99.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.100.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.100.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.100.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.100.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.100.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.101.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.101.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.101.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.101.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.101.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.102.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.102.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.102.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.102.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.102.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.103.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.103.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.103.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.103.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.103.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.104.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.104.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.104.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.104.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.104.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.105.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.105.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.105.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.105.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.105.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.106.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.106.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.106.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.106.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.106.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.107.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.107.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.107.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.107.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.107.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.108.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.108.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.108.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.108.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.108.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.109.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.109.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.109.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.109.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.109.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.110.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.110.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.110.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.110.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.110.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.111.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.111.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.111.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.111.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.111.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.112.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.112.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.112.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.112.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.112.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.113.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.113.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.113.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.113.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.113.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.114.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.114.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.114.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.114.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.114.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.115.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.115.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.115.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.115.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.115.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.116.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.116.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.116.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.116.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.116.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.117.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.117.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.117.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.117.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.117.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.118.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.118.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.118.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.118.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.118.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.119.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.119.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.119.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.119.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.119.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.120.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.120.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.120.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.120.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.120.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.121.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.121.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.121.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.121.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.121.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.122.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.122.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.122.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.122.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.122.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.123.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.123.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.123.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.123.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.123.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.124.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.124.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.124.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.124.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.124.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.125.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.125.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.125.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.125.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.125.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.126.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.126.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.126.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.126.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.126.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.127.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.127.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.127.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.127.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.127.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.128.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.128.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.128.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.128.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.128.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.128.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.129.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.129.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.129.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.129.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.129.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.129.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.130.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.130.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.130.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.130.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.130.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.130.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.131.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.131.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.131.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.131.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.131.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.131.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.132.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.132.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.132.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.132.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.132.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.132.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.133.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.133.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.133.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.133.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.133.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.133.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.134.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.134.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.134.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.134.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.134.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.134.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.135.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.135.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.135.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.135.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.135.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.135.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.136.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.136.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.136.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.136.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.136.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.136.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.137.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.137.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.137.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.137.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.137.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.137.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.138.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.138.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.138.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.138.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.138.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.138.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.139.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.139.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.139.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.139.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.139.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.139.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.140.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.140.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.140.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.140.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.140.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.140.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.141.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.141.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.141.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.141.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.141.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.141.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.142.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.142.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.142.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.142.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.142.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.142.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.143.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.143.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.143.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.143.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.143.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.143.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.144.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.144.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.144.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.144.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.144.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.144.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.145.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.145.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.145.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.145.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.145.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.145.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.146.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.146.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.146.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.146.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.146.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.146.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.147.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.147.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.147.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.147.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.147.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.147.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.148.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.148.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.148.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.148.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.148.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.148.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.149.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.149.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.149.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.149.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.149.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.149.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.150.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.150.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.150.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.150.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.150.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.150.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.151.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.151.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.151.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.151.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.151.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.151.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.152.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.152.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.152.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.152.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.152.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.152.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.153.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.153.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.153.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.153.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.153.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.153.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.154.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.154.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.154.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.154.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.154.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.154.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.155.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.155.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.155.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.155.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.155.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.155.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.156.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.156.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.156.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.156.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.156.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.156.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.157.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.157.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.157.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.157.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.157.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.157.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.158.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.158.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.158.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.158.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.158.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.158.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.159.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.159.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.159.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.159.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.159.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.159.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.160.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.160.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.160.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.160.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.160.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.160.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.161.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.161.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.161.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.161.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.161.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.161.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.162.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.162.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.162.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.162.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.162.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.162.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.163.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.163.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.163.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.163.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.163.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.163.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.164.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.164.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.164.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.164.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.164.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.164.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.165.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.165.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.165.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.165.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.165.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.165.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.166.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.166.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.166.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.166.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.166.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.166.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.167.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.167.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.167.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.167.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.167.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.167.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.168.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.168.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.168.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.168.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.168.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.168.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.169.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.169.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.169.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.169.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.169.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.169.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.170.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.170.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.170.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.170.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.170.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.170.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.171.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.171.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.171.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.171.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.171.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.171.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.172.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.172.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.172.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.172.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.172.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.172.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.173.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.173.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.173.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.173.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.173.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.173.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.174.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.174.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.174.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.174.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.174.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.174.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.175.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.175.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.175.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.175.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.175.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.175.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.176.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.176.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.176.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.176.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.176.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.176.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.177.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.177.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.177.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.177.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.177.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.177.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.178.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.178.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.178.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.178.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.178.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.178.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.179.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.179.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.179.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.179.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.179.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.179.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.180.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.180.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.180.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.180.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.180.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.180.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.181.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.181.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.181.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.181.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.181.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.181.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.182.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.182.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.182.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.182.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.182.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.182.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.183.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.183.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.183.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.183.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.183.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.183.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.184.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.184.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.184.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.184.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.184.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.184.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.185.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.185.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.185.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.185.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.185.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.185.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.186.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.186.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.186.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.186.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.186.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.186.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.187.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.187.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.187.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.187.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.187.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.187.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.188.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.188.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.188.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.188.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.188.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.188.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.189.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.189.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.189.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.189.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.189.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.189.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.190.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.190.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.190.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.190.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.190.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.190.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.191.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.191.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.191.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.191.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.191.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.191.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.192.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.192.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.192.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.192.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.192.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.192.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.193.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.193.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.193.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.193.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.193.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.193.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.194.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.194.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.194.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.194.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.194.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.194.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.195.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.195.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.195.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.195.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.195.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.195.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.196.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.196.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.196.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.196.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.196.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.196.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.197.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.197.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.197.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.197.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.197.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.197.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.198.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.198.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.198.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.198.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.198.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.198.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.199.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.199.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.199.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.199.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.199.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.199.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.200.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.200.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.200.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.200.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.200.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.200.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.201.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.201.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.201.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.201.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.201.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.201.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.202.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.202.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.202.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.202.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.202.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.202.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.203.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.203.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.203.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.203.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.203.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.203.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.204.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.204.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.204.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.204.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.204.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.204.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.205.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.205.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.205.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.205.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.205.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.205.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.206.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.206.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.206.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.206.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.206.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.206.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.207.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.207.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.207.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.207.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.207.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.207.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.208.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.208.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.208.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.208.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.208.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.208.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.209.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.209.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.209.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.209.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.209.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.209.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.210.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.210.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.210.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.210.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.210.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.210.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.211.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.211.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.211.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.211.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.211.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.211.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.212.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.212.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.212.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.212.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.212.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.212.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.213.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.213.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.213.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.213.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.213.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.213.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.214.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.214.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.214.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.214.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.214.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.214.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.215.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.215.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.215.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.215.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.215.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.215.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.216.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.216.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.216.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.216.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.216.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.216.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.217.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.217.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.217.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.217.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.217.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.217.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.218.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.218.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.218.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.218.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.218.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.218.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.219.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.219.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.219.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.219.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.219.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.219.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.220.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.220.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.220.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.220.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.220.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.220.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.221.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.221.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.221.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.221.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.221.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.221.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.222.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.222.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.222.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.222.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.222.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.222.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.223.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.223.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.223.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.223.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.223.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.223.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.224.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.224.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.224.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.224.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.224.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.224.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.225.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.225.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.225.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.225.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.225.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.225.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.226.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.226.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.226.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.226.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.226.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.226.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.227.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.227.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.227.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.227.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.227.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.227.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.228.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.228.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.228.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.228.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.228.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.228.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.229.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.229.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.229.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.229.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.229.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.229.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.230.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.230.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.230.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.230.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.230.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.230.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.231.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.231.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.231.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.231.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.231.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.231.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.232.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.232.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.232.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.232.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.232.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.232.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.233.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.233.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.233.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.233.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.233.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.233.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.234.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.234.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.234.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.234.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.234.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.234.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.235.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.235.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.235.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.235.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.235.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.235.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.236.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.236.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.236.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.236.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.236.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.236.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.237.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.237.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.237.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.237.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.237.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.237.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.238.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.238.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.238.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.238.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.238.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.238.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.239.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.239.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.239.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.239.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.239.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.239.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.240.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.240.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.240.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.240.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.240.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.240.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.241.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.241.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.241.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.241.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.241.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.241.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.242.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.242.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.242.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.242.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.242.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.242.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.243.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.243.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.243.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.243.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.243.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.243.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.244.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.244.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.244.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.244.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.244.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.244.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.245.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.245.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.245.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.245.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.245.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.245.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.246.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.246.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.246.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.246.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.246.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.246.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.247.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.247.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.247.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.247.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.247.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.247.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.248.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.248.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.248.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.248.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.248.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.248.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.249.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.249.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.249.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.249.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.249.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.249.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.250.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.250.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.250.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.250.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.250.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.250.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.251.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.251.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.251.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.251.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.251.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.251.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.252.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.252.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.252.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.252.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.252.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.252.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.253.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.253.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.253.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.253.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.253.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.253.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.254.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.254.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.254.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.254.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.254.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.254.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.255.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.255.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.255.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.255.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.255.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.255.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.input_layernorm.weight": "model-00073-of-000163.safetensors", "model.layers.28.post_attention_layernorm.weight": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.q_a_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.self_attn.q_a_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.q_a_layernorm.weight": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.q_b_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.self_attn.q_b_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.kv_a_proj_with_mqa.weight": "model-00073-of-000163.safetensors", - "model.layers.29.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.kv_a_layernorm.weight": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.kv_b_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.self_attn.kv_b_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.o_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.self_attn.o_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.gate.weight": "model-00073-of-000163.safetensors", "model.layers.29.mlp.gate.e_score_correction_bias": "model-00073-of-000163.safetensors", "model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.shared_experts.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.shared_experts.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.shared_experts.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.0.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.0.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.0.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.0.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.0.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.1.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.1.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.1.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.1.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.1.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.2.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.2.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.2.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.2.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.2.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.3.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.3.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.3.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.3.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.3.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.4.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.4.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.4.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.4.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.4.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.5.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.5.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.5.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.5.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.5.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.6.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.6.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.6.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.6.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.6.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.7.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.7.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.7.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.7.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.7.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.8.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.8.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.8.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.8.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.8.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.9.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.9.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.9.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.9.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.9.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.10.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.10.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.10.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.10.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.10.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.11.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.11.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.11.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.11.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.11.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.12.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.12.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.12.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.12.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.12.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.13.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.13.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.13.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.13.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.13.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.14.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.14.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.14.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.14.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.14.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.15.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.15.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.15.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.15.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.15.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.16.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.16.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.16.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.16.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.16.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.17.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.17.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.17.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.17.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.17.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.18.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.18.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.18.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.18.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.18.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.19.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.19.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.19.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.19.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.19.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.20.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.20.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.20.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.20.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.20.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.21.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.21.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.21.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.21.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.21.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.22.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.22.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.22.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.22.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.22.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.23.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.23.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.23.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.23.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.23.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.24.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.24.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.24.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.24.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.24.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.25.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.25.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.25.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.25.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.25.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.26.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.26.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.26.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.26.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.26.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.27.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.27.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.27.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.27.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.27.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.28.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.28.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.28.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.28.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.28.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.29.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.29.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.29.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.29.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.29.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.30.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.30.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.30.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.30.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.30.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.30.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.31.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.31.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.31.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.31.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.31.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.32.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.32.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.32.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.32.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.32.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.33.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.33.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.33.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.33.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.33.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.34.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.34.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.34.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.34.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.34.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.35.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.35.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.35.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.35.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.35.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.36.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.36.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.36.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.36.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.36.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.37.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.37.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.37.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.37.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.37.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.38.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.38.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.38.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.38.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.38.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.39.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.39.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.39.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.39.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.39.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.39.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.40.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.40.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.40.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.40.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.40.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.41.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.41.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.41.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.41.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.41.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.42.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.42.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.42.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.42.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.42.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.43.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.43.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.43.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.43.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.43.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.44.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.44.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.44.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.44.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.44.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.45.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.45.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.45.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.45.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.45.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.46.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.46.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.46.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.46.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.46.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.47.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.47.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.47.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.47.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.47.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.48.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.48.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.48.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.48.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.48.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.49.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.49.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.49.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.49.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.49.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.50.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.50.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.50.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.50.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.50.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.51.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.51.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.51.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.51.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.51.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.52.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.52.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.52.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.52.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.52.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.53.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.53.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.53.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.53.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.53.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.54.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.54.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.54.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.54.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.54.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.55.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.55.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.55.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.55.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.55.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.56.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.56.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.56.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.56.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.56.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.57.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.57.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.57.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.57.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.57.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.58.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.58.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.58.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.58.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.58.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.59.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.59.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.59.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.59.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.59.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.60.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.60.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.60.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.60.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.60.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.61.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.61.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.61.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.61.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.61.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.62.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.62.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.62.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.62.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.62.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.63.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.63.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.63.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.63.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.63.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.64.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.64.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.64.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.64.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.64.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.65.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.65.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.65.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.65.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.65.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.66.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.66.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.66.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.66.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.66.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.67.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.67.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.67.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.67.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.67.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.68.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.68.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.68.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.68.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.68.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.69.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.69.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.69.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.69.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.69.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.70.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.70.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.70.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.70.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.70.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.71.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.71.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.71.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.71.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.71.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.72.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.72.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.72.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.72.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.72.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.73.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.73.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.73.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.73.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.73.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.74.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.74.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.74.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.74.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.74.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.75.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.75.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.75.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.75.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.75.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.76.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.76.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.76.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.76.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.76.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.77.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.77.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.77.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.77.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.77.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.78.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.78.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.78.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.78.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.78.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.79.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.79.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.79.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.79.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.79.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.80.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.80.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.80.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.80.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.80.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.81.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.81.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.81.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.81.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.81.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.82.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.82.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.82.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.82.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.82.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.83.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.83.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.83.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.83.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.83.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.83.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.84.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.84.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.84.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.84.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.84.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.85.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.85.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.85.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.85.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.85.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.86.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.86.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.86.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.86.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.86.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.87.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.87.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.87.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.87.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.87.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.88.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.88.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.88.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.88.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.88.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.89.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.89.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.89.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.89.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.89.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.90.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.90.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.90.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.90.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.90.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.91.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.91.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.91.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.91.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.91.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.92.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.92.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.92.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.92.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.92.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.93.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.93.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.93.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.93.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.93.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.93.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.94.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.94.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.94.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.94.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.94.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.95.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.95.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.95.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.95.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.95.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.96.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.96.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.96.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.96.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.96.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.97.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.97.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.97.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.97.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.97.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.98.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.98.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.98.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.98.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.98.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.99.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.99.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.99.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.99.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.99.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.100.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.100.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.100.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.100.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.100.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.101.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.101.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.101.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.101.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.101.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.102.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.102.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.102.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.102.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.102.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.103.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.103.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.103.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.103.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.103.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.104.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.104.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.104.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.104.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.104.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.105.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.105.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.105.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.105.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.105.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.106.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.106.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.106.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.106.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.106.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.107.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.107.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.107.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.107.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.107.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.108.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.108.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.108.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.108.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.108.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.109.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.109.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.109.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.109.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.109.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.110.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.110.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.110.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.110.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.110.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.111.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.111.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.111.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.111.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.111.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.112.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.112.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.112.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.112.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.112.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.113.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.113.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.113.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.113.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.113.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.114.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.114.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.114.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.114.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.114.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.115.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.115.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.115.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.115.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.115.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.116.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.116.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.116.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.116.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.116.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.117.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.117.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.117.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.117.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.117.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.118.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.118.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.118.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.118.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.118.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.119.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.119.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.119.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.119.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.119.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.120.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.120.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.120.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.120.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.120.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.121.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.121.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.121.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.121.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.121.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.122.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.122.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.122.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.122.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.122.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.123.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.123.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.123.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.123.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.123.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.124.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.124.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.124.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.124.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.124.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.125.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.125.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.125.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.125.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.125.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.126.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.126.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.126.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.126.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.126.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.127.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.127.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.127.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.127.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.127.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.128.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.128.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.128.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.128.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.128.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.128.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.129.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.129.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.129.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.129.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.129.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.129.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.130.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.130.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.130.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.130.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.130.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.130.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.131.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.131.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.131.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.131.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.131.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.131.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.132.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.132.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.132.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.132.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.132.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.132.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.133.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.133.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.133.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.133.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.133.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.133.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.134.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.134.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.134.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.134.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.134.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.134.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.135.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.135.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.135.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.135.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.135.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.135.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.136.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.136.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.136.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.136.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.136.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.136.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.137.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.137.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.137.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.137.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.137.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.137.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.138.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.138.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.138.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.138.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.138.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.138.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.139.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.139.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.139.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.139.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.139.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.139.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.140.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.140.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.140.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.140.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.140.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.140.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.141.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.141.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.141.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.141.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.141.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.141.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.142.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.142.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.142.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.142.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.142.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.142.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.143.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.143.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.143.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.143.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.143.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.143.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.144.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.144.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.144.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.144.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.144.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.144.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.145.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.145.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.145.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.145.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.145.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.145.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.146.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.146.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.146.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.146.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.146.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.146.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.147.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.147.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.147.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.147.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.147.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.147.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.148.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.148.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.148.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.148.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.148.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.148.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.149.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.149.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.149.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.149.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.149.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.149.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.150.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.150.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.150.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.150.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.150.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.150.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.151.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.151.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.151.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.151.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.151.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.151.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.152.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.152.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.152.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.152.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.152.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.152.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.153.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.153.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.153.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.153.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.153.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.153.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.154.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.154.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.154.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.154.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.154.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.154.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.155.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.155.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.155.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.155.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.155.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.155.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.156.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.156.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.156.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.156.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.156.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.156.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.157.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.157.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.157.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.157.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.157.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.157.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.158.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.158.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.158.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.158.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.158.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.158.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.159.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.159.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.159.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.159.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.159.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.159.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.160.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.160.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.160.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.160.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.160.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.160.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.161.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.161.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.161.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.161.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.161.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.161.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.162.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.162.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.162.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.162.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.162.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.162.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.163.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.163.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.163.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.163.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.163.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.163.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.164.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.164.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.164.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.164.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.164.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.164.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.165.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.165.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.165.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.165.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.165.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.165.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.166.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.166.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.166.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.166.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.166.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.166.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.167.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.167.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.167.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.167.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.167.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.167.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.168.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.168.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.168.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.168.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.168.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.168.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.169.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.169.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.169.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.169.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.169.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.169.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.170.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.170.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.170.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.170.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.170.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.170.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.171.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.171.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.171.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.171.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.171.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.171.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.172.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.172.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.172.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.172.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.172.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.172.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.173.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.173.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.173.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.173.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.173.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.173.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.174.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.174.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.174.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.174.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.174.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.174.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.175.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.175.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.175.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.175.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.175.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.175.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.176.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.176.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.176.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.176.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.176.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.176.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.177.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.177.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.177.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.177.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.177.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.177.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.178.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.178.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.178.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.178.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.178.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.178.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.179.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.179.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.179.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.179.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.179.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.179.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.180.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.180.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.180.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.180.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.180.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.180.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.181.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.181.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.181.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.181.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.181.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.181.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.182.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.182.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.182.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.182.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.182.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.182.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.183.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.183.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.183.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.183.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.183.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.183.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.184.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.184.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.184.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.184.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.184.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.184.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.185.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.185.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.185.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.185.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.185.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.185.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.186.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.186.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.186.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.186.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.186.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.186.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.187.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.187.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.187.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.187.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.187.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.187.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.188.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.188.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.188.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.188.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.188.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.188.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.189.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.189.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.189.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.189.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.189.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.189.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.190.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.190.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.190.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.190.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.190.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.190.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.191.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.191.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.191.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.191.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.191.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.191.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.192.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.192.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.192.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.192.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.192.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.192.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.193.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.193.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.193.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.193.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.193.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.193.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.194.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.194.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.194.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.194.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.194.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.194.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.195.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.195.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.195.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.195.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.195.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.195.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.196.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.196.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.196.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.196.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.196.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.196.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.197.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.197.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.197.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.197.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.197.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.197.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.198.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.198.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.198.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.198.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.198.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.198.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.199.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.199.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.199.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.199.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.199.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.199.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.200.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.200.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.200.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.200.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.200.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.200.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.201.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.201.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.201.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.201.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.201.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.201.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.202.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.202.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.202.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.202.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.202.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.202.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.203.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.203.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.203.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.203.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.203.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.203.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.204.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.204.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.204.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.204.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.204.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.204.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.205.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.205.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.205.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.205.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.205.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.205.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.206.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.206.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.206.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.206.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.206.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.206.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.207.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.207.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.207.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.207.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.207.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.207.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.208.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.208.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.208.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.208.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.208.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.208.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.209.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.209.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.209.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.209.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.209.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.209.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.210.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.210.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.210.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.210.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.210.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.210.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.211.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.211.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.211.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.211.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.211.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.211.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.212.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.212.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.212.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.212.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.212.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.212.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.213.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.213.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.213.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.213.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.213.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.213.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.214.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.214.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.214.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.214.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.214.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.214.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.215.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.215.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.215.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.215.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.215.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.215.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.216.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.216.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.216.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.216.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.216.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.216.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.217.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.217.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.217.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.217.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.217.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.217.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.218.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.218.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.218.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.218.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.218.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.218.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.219.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.219.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.219.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.219.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.219.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.219.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.220.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.220.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.220.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.220.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.220.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.220.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.221.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.221.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.221.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.221.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.221.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.221.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.222.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.222.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.222.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.222.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.222.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.222.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.223.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.223.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.223.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.223.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.223.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.223.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.224.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.224.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.224.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.224.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.224.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.224.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.225.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.225.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.225.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.225.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.225.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.225.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.226.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.226.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.226.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.226.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.226.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.226.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.227.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.227.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.227.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.227.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.227.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.227.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.228.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.228.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.228.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.228.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.228.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.228.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.229.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.229.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.229.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.229.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.229.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.229.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.230.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.230.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.230.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.230.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.230.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.230.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.231.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.231.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.231.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.231.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.231.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.231.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.232.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.232.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.232.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.232.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.232.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.232.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.233.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.233.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.233.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.233.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.233.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.233.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.234.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.234.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.234.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.234.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.234.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.234.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.235.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.235.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.235.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.235.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.235.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.235.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.236.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.236.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.236.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.236.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.236.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.236.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.237.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.237.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.237.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.237.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.237.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.237.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.238.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.238.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.238.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.238.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.238.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.238.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.239.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.239.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.239.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.239.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.239.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.239.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.240.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.240.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.240.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.240.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.240.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.240.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.241.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.241.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.241.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.241.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.241.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.241.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.242.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.242.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.242.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.242.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.242.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.242.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.243.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.243.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.243.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.243.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.243.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.243.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.244.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.244.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.244.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.244.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.244.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.244.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.245.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.245.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.245.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.245.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.245.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.245.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.246.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.246.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.246.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.246.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.246.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.246.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.247.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.247.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.247.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.247.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.247.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.247.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.248.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.248.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.248.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.248.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.248.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.248.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.249.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.249.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.249.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.249.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.249.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.249.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.250.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.250.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.250.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.250.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.250.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.250.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.251.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.251.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.251.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.251.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.251.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.251.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.252.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.252.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.252.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.252.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.252.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.252.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.253.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.253.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.253.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.253.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.253.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.253.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.254.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.254.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.254.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.254.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.254.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.254.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.255.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.255.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.255.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.255.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.255.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.255.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.input_layernorm.weight": "model-00075-of-000163.safetensors", "model.layers.29.post_attention_layernorm.weight": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.q_a_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.self_attn.q_a_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.q_a_layernorm.weight": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.q_b_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.self_attn.q_b_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.kv_a_proj_with_mqa.weight": "model-00075-of-000163.safetensors", - "model.layers.30.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.kv_a_layernorm.weight": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.kv_b_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.self_attn.kv_b_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.o_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.self_attn.o_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.gate.weight": "model-00075-of-000163.safetensors", "model.layers.30.mlp.gate.e_score_correction_bias": "model-00075-of-000163.safetensors", "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.shared_experts.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.shared_experts.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.shared_experts.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.0.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.0.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.0.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.0.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.0.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.1.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.1.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.1.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.1.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.1.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.2.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.2.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.2.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.2.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.2.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.3.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.3.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.3.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.3.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.3.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.4.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.4.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.4.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.4.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.4.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.5.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.5.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.5.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.5.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.5.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.6.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.6.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.6.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.6.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.6.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.7.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.7.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.7.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.7.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.7.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.8.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.8.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.8.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.8.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.8.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.9.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.9.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.9.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.9.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.9.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.10.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.10.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.10.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.10.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.10.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.11.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.11.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.11.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.11.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.11.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.12.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.12.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.12.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.12.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.12.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.13.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.13.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.13.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.13.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.13.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.14.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.14.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.14.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.14.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.14.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.15.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.15.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.15.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.15.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.15.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.16.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.16.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.16.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.16.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.16.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.17.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.17.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.17.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.17.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.17.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.18.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.18.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.18.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.18.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.18.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.19.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.19.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.19.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.19.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.19.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.20.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.20.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.20.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.20.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.20.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.21.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.21.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.21.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.21.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.21.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.22.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.22.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.22.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.22.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.22.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.23.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.23.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.23.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.23.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.23.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.24.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.24.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.24.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.24.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.24.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.25.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.25.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.25.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.25.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.25.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.26.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.26.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.26.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.26.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.26.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.27.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.27.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.27.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.27.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.27.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.28.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.28.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.28.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.28.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.28.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.29.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.29.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.29.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.29.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.29.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.30.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.30.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.30.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.30.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.30.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.31.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.31.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.31.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.31.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.31.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.32.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.32.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.32.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.32.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.32.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.33.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.33.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.33.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.33.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.33.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.34.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.34.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.34.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.34.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.34.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.35.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.35.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.35.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.35.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.35.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.36.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.36.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.36.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.36.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.36.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.37.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.37.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.37.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.37.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.37.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.38.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.38.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.38.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.38.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.38.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.39.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.39.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.39.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.39.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.39.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.40.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.40.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.40.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.40.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.40.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.41.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.41.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.41.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.41.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.41.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.42.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.42.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.42.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.42.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.42.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.43.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.43.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.43.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.43.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.43.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.44.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.44.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.44.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.44.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.44.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.45.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.45.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.45.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.45.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.45.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.46.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.46.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.46.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.46.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.46.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.47.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.47.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.47.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.47.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.47.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.48.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.48.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.48.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.48.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.48.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.49.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.49.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.49.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.49.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.49.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.50.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.50.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.50.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.50.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.50.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.51.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.51.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.51.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.51.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.51.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.52.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.52.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.52.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.52.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.52.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.53.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.53.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.53.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.53.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.53.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.54.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.54.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.54.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.54.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.54.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.55.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.55.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.55.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.55.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.55.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.56.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.56.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.56.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.56.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.56.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.57.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.57.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.57.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.57.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.57.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.58.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.58.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.58.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.58.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.58.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.59.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.59.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.59.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.59.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.59.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.60.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.60.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.60.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.60.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.60.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.61.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.61.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.61.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.61.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.61.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.62.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.62.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.62.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.62.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.62.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.63.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.63.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.63.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.63.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.63.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.64.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.64.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.64.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.64.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.64.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.65.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.65.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.65.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.65.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.65.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.66.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.66.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.66.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.66.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.66.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.67.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.67.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.67.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.67.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.67.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.68.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.68.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.68.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.68.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.68.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.69.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.69.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.69.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.69.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.69.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.70.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.70.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.70.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.70.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.70.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.71.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.71.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.71.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.71.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.71.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.72.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.72.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.72.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.72.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.72.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.73.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.73.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.73.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.73.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.73.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.74.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.74.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.74.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.74.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.74.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.75.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.75.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.75.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.75.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.75.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.76.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.76.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.76.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.76.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.76.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.77.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.77.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.77.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.77.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.77.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.78.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.78.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.78.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.78.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.78.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.79.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.79.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.79.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.79.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.79.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.80.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.80.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.80.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.80.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.80.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.81.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.81.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.81.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.81.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.81.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.82.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.82.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.82.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.82.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.82.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.83.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.83.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.83.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.83.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.83.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.84.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.84.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.84.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.84.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.84.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.85.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.85.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.85.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.85.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.85.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.86.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.86.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.86.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.86.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.86.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.87.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.87.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.87.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.87.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.87.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.88.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.88.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.88.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.88.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.88.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.89.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.89.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.89.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.89.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.89.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.90.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.90.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.90.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.90.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.90.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.91.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.91.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.91.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.91.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.91.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.92.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.92.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.92.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.92.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.92.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.93.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.93.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.93.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.93.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.93.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.94.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.94.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.94.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.94.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.94.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.95.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.95.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.95.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.95.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.95.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.96.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.96.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.96.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.96.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.96.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.97.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.97.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.97.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.97.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.97.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.98.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.98.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.98.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.98.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.98.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.99.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.99.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.99.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.99.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.99.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.100.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.100.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.100.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.100.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.100.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.101.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.101.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.101.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.101.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.101.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.102.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.102.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.102.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.102.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.102.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.103.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.103.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.103.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.103.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.103.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.104.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.104.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.104.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.104.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.104.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.105.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.105.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.105.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.105.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.105.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.106.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.106.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.106.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.106.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.106.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.107.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.107.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.107.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.107.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.107.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.108.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.108.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.108.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.108.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.108.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.109.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.109.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.109.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.109.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.109.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.110.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.110.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.110.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.110.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.110.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.111.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.111.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.111.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.111.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.111.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.112.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.112.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.112.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.112.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.112.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.113.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.113.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.113.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.113.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.113.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.114.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.114.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.114.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.114.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.114.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.115.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.115.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.115.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.115.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.115.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.116.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.116.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.116.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.116.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.116.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.117.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.117.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.117.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.117.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.117.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.118.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.118.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.118.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.118.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.118.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.119.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.119.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.119.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.119.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.119.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.120.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.120.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.120.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.120.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.120.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.121.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.121.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.121.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.121.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.121.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.122.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.122.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.122.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.122.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.122.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.123.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.123.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.123.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.123.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.123.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.124.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.124.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.124.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.124.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.124.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.125.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.125.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.125.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.125.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.125.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.126.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.126.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.126.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.126.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.126.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.127.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.127.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.127.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.127.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.127.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.128.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.128.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.128.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.128.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.128.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.128.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.129.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.129.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.129.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.129.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.129.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.129.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.130.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.130.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.130.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.130.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.130.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.130.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.131.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.131.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.131.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.131.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.131.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.131.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.132.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.132.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.132.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.132.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.132.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.132.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.133.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.133.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.133.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.133.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.133.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.133.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.134.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.134.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.134.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.134.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.134.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.134.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.135.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.135.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.135.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.135.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.135.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.135.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.136.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.136.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.136.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.136.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.136.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.136.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.137.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.137.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.137.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.137.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.137.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.137.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.138.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.138.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.138.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.138.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.138.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.138.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.139.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.139.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.139.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.139.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.139.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.139.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.140.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.140.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.140.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.140.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.140.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.140.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.141.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.141.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.141.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.141.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.141.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.141.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.142.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.142.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.142.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.142.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.142.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.142.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.143.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.143.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.143.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.143.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.143.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.143.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.144.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.144.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.144.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.144.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.144.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.144.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.145.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.145.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.145.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.145.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.145.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.145.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.146.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.146.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.146.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.146.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.146.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.146.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.147.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.147.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.147.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.147.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.147.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.147.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.148.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.148.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.148.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.148.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.148.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.148.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.149.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.149.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.149.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.149.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.149.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.149.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.150.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.150.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.150.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.150.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.150.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.150.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.151.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.151.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.151.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.151.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.151.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.151.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.152.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.152.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.152.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.152.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.152.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.152.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.153.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.153.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.153.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.153.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.153.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.153.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.154.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.154.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.154.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.154.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.154.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.154.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.155.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.155.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.155.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.155.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.155.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.155.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.156.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.156.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.156.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.156.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.156.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.156.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.157.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.157.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.157.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.157.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.157.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.157.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.158.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.158.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.158.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.158.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.158.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.158.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.159.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.159.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.159.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.159.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.159.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.159.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.160.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.160.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.160.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.160.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.160.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.160.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.161.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.161.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.161.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.161.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.161.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.161.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.162.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.162.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.162.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.162.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.162.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.162.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.163.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.163.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.163.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.163.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.163.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.163.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.164.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.164.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.164.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.164.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.164.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.164.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.165.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.165.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.165.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.165.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.165.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.165.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.166.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.166.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.166.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.166.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.166.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.166.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.167.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.167.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.167.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.167.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.167.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.167.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.168.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.168.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.168.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.168.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.168.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.168.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.169.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.169.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.169.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.169.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.169.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.169.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.170.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.170.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.170.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.170.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.170.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.170.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.171.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.171.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.171.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.171.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.171.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.171.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.172.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.172.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.172.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.172.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.172.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.172.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.173.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.173.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.173.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.173.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.173.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.173.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.174.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.174.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.174.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.174.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.174.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.174.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.175.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.175.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.175.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.175.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.175.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.175.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.176.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.176.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.176.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.176.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.176.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.176.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.177.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.177.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.177.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.177.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.177.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.177.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.178.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.178.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.178.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.178.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.178.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.178.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.179.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.179.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.179.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.179.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.179.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.179.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.180.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.180.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.180.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.180.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.180.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.180.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.181.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.181.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.181.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.181.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.181.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.181.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.182.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.182.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.182.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.182.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.182.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.182.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.183.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.183.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.183.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.183.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.183.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.183.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.184.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.184.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.184.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.184.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.184.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.184.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.185.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.185.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.185.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.185.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.185.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.185.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.186.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.186.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.186.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.186.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.186.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.186.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.187.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.187.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.187.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.187.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.187.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.187.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.188.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.188.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.188.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.188.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.188.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.188.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.189.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.189.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.189.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.189.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.189.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.189.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.190.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.190.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.190.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.190.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.190.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.190.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.191.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.191.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.191.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.191.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.191.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.191.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.192.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.192.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.192.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.192.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.192.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.192.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.193.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.193.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.193.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.193.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.193.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.193.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.194.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.194.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.194.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.194.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.194.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.194.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.195.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.195.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.195.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.195.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.195.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.195.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.196.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.196.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.196.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.196.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.196.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.196.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.197.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.197.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.197.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.197.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.197.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.197.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.198.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.198.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.198.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.198.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.198.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.198.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.199.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.199.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.199.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.199.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.199.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.199.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.200.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.200.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.200.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.200.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.200.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.200.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.201.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.201.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.201.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.201.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.201.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.201.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.202.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.202.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.202.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.202.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.202.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.202.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.203.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.203.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.203.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.203.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.203.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.203.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.204.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.204.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.204.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.204.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.204.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.204.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.205.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.205.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.205.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.205.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.205.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.205.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.206.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.206.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.206.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.206.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.206.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.206.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.207.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.207.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.207.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.207.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.207.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.207.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.208.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.208.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.208.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.208.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.208.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.208.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.209.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.209.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.209.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.209.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.209.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.209.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.210.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.210.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.210.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.210.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.210.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.210.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.211.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.211.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.211.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.211.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.211.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.211.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.212.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.212.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.212.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.212.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.212.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.212.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.213.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.213.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.213.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.213.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.213.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.213.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.214.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.214.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.214.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.214.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.214.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.214.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.215.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.215.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.215.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.215.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.215.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.215.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.216.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.216.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.216.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.216.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.216.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.216.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.217.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.217.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.217.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.217.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.217.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.217.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.218.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.218.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.218.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.218.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.218.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.218.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.219.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.219.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.219.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.219.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.219.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.219.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.220.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.220.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.220.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.220.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.220.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.220.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.221.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.221.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.221.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.221.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.221.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.221.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.222.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.222.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.222.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.222.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.222.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.222.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.223.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.223.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.223.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.223.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.223.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.223.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.224.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.224.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.224.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.224.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.224.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.224.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.225.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.225.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.225.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.225.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.225.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.225.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.226.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.226.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.226.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.226.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.226.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.226.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.227.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.227.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.227.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.227.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.227.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.227.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.228.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.228.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.228.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.228.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.228.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.228.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.229.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.229.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.229.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.229.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.229.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.229.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.230.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.230.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.230.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.230.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.230.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.230.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.231.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.231.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.231.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.231.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.231.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.231.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.232.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.232.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.232.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.232.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.232.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.232.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.233.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.233.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.233.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.233.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.233.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.233.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.234.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.234.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.234.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.234.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.234.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.234.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.235.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.235.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.235.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.235.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.235.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.235.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.236.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.236.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.236.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.236.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.236.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.236.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.237.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.237.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.237.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.237.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.237.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.237.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.238.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.238.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.238.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.238.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.238.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.238.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.239.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.239.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.239.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.239.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.239.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.239.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.240.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.240.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.240.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.240.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.240.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.240.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.241.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.241.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.241.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.241.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.241.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.241.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.242.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.242.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.242.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.242.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.242.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.242.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.243.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.243.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.243.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.243.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.243.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.243.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.244.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.244.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.244.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.244.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.244.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.244.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.245.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.245.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.245.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.245.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.245.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.245.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.246.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.246.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.246.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.246.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.246.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.246.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.247.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.247.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.247.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.247.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.247.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.247.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.248.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.248.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.248.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.248.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.248.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.248.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.249.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.249.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.249.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.249.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.249.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.249.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.250.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.250.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.250.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.250.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.250.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.250.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.251.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.251.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.251.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.251.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.251.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.251.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.252.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.252.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.252.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.252.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.252.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.252.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.253.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.253.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.253.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.253.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.253.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.253.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.254.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.254.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.254.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.254.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.254.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.254.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.255.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.255.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.255.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.255.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.255.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.255.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.input_layernorm.weight": "model-00078-of-000163.safetensors", "model.layers.30.post_attention_layernorm.weight": "model-00078-of-000163.safetensors", "model.layers.31.self_attn.q_a_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.self_attn.q_a_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.self_attn.q_a_layernorm.weight": "model-00079-of-000163.safetensors", "model.layers.31.self_attn.q_b_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.self_attn.q_b_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.self_attn.kv_a_proj_with_mqa.weight": "model-00079-of-000163.safetensors", - "model.layers.31.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.self_attn.kv_a_layernorm.weight": "model-00079-of-000163.safetensors", "model.layers.31.self_attn.kv_b_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.self_attn.kv_b_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.self_attn.o_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.self_attn.o_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.gate.weight": "model-00079-of-000163.safetensors", "model.layers.31.mlp.gate.e_score_correction_bias": "model-00079-of-000163.safetensors", "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.shared_experts.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.shared_experts.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.0.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.0.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.0.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.0.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.0.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.1.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.1.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.1.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.1.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.1.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.2.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.2.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.2.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.2.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.2.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.3.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.3.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.3.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.3.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.3.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.4.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.4.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.4.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.4.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.4.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.5.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.5.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.5.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.5.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.5.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.6.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.6.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.6.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.6.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.6.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.7.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.7.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.7.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.7.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.7.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.8.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.8.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.8.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.8.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.8.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.9.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.9.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.9.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.9.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.9.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.10.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.10.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.10.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.10.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.10.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.11.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.11.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.11.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.11.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.11.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.12.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.12.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.12.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.12.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.12.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.13.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.13.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.13.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.13.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.13.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.14.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.14.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.14.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.14.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.14.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.15.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.15.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.15.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.15.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.15.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.16.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.16.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.16.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.16.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.16.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.17.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.17.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.17.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.17.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.17.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.17.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.18.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.18.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.18.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.18.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.18.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.19.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.19.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.19.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.19.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.19.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.20.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.20.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.20.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.20.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.20.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.21.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.21.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.21.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.21.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.21.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.22.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.22.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.22.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.22.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.22.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.23.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.23.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.23.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.23.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.23.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.24.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.24.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.24.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.24.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.24.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.25.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.25.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.25.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.25.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.25.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.26.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.26.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.26.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.26.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.26.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.27.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.27.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.27.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.27.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.27.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.28.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.28.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.28.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.28.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.28.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.29.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.29.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.29.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.29.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.29.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.30.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.30.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.30.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.30.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.30.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.31.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.31.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.31.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.31.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.31.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.32.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.32.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.32.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.32.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.32.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.33.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.33.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.33.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.33.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.33.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.34.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.34.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.34.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.34.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.34.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.35.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.35.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.35.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.35.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.35.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.36.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.36.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.36.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.36.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.36.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.37.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.37.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.37.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.37.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.37.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.38.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.38.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.38.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.38.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.38.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.39.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.39.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.39.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.39.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.39.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.40.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.40.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.40.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.40.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.40.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.41.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.41.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.41.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.41.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.41.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.42.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.42.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.42.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.42.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.42.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.43.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.43.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.43.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.43.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.43.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.44.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.44.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.44.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.44.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.44.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.45.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.45.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.45.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.45.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.45.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.46.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.46.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.46.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.46.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.46.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.47.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.47.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.47.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.47.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.47.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.48.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.48.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.48.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.48.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.48.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.49.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.49.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.49.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.49.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.49.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.50.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.50.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.50.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.50.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.50.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.51.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.51.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.51.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.51.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.51.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.52.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.52.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.52.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.52.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.52.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.53.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.53.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.53.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.53.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.53.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.54.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.54.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.54.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.54.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.54.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.55.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.55.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.55.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.55.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.55.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.56.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.56.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.56.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.56.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.56.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.57.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.57.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.57.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.57.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.57.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.58.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.58.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.58.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.58.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.58.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.59.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.59.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.59.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.59.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.59.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.60.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.60.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.60.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.60.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.60.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.61.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.61.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.61.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.61.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.61.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.62.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.62.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.62.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.62.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.62.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.63.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.63.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.63.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.63.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.63.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.64.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.64.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.64.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.64.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.64.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.65.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.65.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.65.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.65.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.65.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.66.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.66.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.66.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.66.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.66.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.67.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.67.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.67.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.67.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.67.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.68.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.68.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.68.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.68.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.68.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.69.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.69.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.69.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.69.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.69.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.70.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.70.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.70.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.70.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.70.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.71.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.71.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.71.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.71.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.71.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.72.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.72.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.72.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.72.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.72.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.73.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.73.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.73.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.73.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.73.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.74.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.74.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.74.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.74.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.74.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.75.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.75.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.75.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.75.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.75.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.76.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.76.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.76.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.76.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.76.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.77.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.77.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.77.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.77.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.77.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.78.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.78.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.78.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.78.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.78.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.79.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.79.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.79.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.79.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.79.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.80.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.80.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.80.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.80.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.80.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.81.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.81.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.81.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.81.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.81.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.82.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.82.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.82.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.82.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.82.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.83.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.83.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.83.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.83.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.83.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.84.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.84.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.84.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.84.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.84.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.85.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.85.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.85.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.85.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.85.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.86.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.86.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.86.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.86.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.86.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.87.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.87.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.87.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.87.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.87.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.88.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.88.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.88.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.88.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.88.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.89.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.89.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.89.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.89.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.89.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.90.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.90.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.90.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.90.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.90.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.91.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.91.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.91.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.91.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.91.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.92.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.92.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.92.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.92.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.92.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.93.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.93.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.93.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.93.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.93.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.94.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.94.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.94.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.94.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.94.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.95.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.95.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.95.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.95.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.95.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.96.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.96.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.96.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.96.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.96.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.97.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.97.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.97.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.97.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.97.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.98.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.98.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.98.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.98.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.98.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.99.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.99.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.99.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.99.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.99.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.100.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.100.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.100.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.100.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.100.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.101.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.101.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.101.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.101.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.101.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.102.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.102.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.102.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.102.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.102.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.103.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.103.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.103.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.103.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.103.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.104.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.104.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.104.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.104.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.104.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.105.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.105.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.105.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.105.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.105.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.106.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.106.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.106.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.106.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.106.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.107.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.107.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.107.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.107.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.107.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.108.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.108.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.108.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.108.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.108.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.109.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.109.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.109.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.109.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.109.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.110.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.110.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.110.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.110.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.110.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.111.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.111.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.111.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.111.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.111.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.112.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.112.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.112.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.112.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.112.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.113.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.113.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.113.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.113.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.113.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.114.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.114.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.114.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.114.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.114.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.115.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.115.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.115.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.115.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.115.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.116.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.116.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.116.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.116.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.116.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.117.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.117.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.117.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.117.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.117.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.118.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.118.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.118.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.118.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.118.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.119.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.119.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.119.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.119.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.119.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.120.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.120.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.120.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.120.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.120.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.121.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.121.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.121.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.121.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.121.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.122.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.122.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.122.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.122.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.122.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.123.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.123.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.123.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.123.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.123.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.124.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.124.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.124.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.124.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.124.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.125.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.125.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.125.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.125.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.125.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.126.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.126.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.126.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.126.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.126.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.127.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.127.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.127.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.127.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.127.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.128.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.128.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.128.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.128.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.128.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.128.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.129.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.129.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.129.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.129.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.129.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.129.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.130.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.130.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.130.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.130.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.130.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.130.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.131.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.131.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.131.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.131.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.131.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.131.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.132.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.132.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.132.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.132.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.132.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.132.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.133.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.133.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.133.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.133.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.133.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.133.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.134.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.134.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.134.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.134.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.134.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.134.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.135.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.135.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.135.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.135.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.135.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.135.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.136.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.136.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.136.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.136.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.136.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.136.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.137.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.137.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.137.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.137.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.137.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.137.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.138.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.138.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.138.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.138.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.138.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.138.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.139.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.139.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.139.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.139.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.139.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.139.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.140.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.140.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.140.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.140.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.140.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.140.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.141.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.141.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.141.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.141.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.141.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.141.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.142.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.142.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.142.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.142.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.142.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.142.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.143.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.143.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.143.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.143.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.143.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.143.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.144.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.144.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.144.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.144.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.144.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.144.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.145.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.145.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.145.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.145.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.145.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.145.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.146.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.146.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.146.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.146.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.146.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.146.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.147.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.147.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.147.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.147.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.147.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.147.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.148.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.148.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.148.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.148.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.148.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.148.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.149.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.149.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.149.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.149.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.149.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.149.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.150.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.150.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.150.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.150.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.150.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.150.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.151.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.151.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.151.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.151.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.151.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.151.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.152.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.152.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.152.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.152.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.152.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.152.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.153.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.153.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.153.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.153.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.153.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.153.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.154.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.154.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.154.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.154.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.154.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.154.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.155.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.155.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.155.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.155.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.155.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.155.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.156.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.156.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.156.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.156.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.156.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.156.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.157.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.157.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.157.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.157.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.157.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.157.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.158.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.158.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.158.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.158.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.158.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.158.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.159.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.159.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.159.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.159.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.159.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.159.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.160.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.160.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.160.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.160.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.160.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.160.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.161.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.161.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.161.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.161.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.161.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.161.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.162.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.162.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.162.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.162.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.162.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.162.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.163.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.163.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.163.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.163.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.163.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.163.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.164.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.164.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.164.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.164.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.164.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.164.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.165.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.165.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.165.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.165.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.165.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.165.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.166.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.166.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.166.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.166.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.166.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.166.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.167.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.167.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.167.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.167.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.167.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.167.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.168.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.168.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.168.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.168.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.168.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.168.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.169.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.169.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.169.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.169.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.169.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.169.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.170.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.170.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.170.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.170.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.170.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.170.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.171.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.171.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.171.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.171.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.171.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.171.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.172.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.172.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.172.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.172.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.172.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.172.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.173.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.173.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.173.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.173.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.173.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.173.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.174.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.174.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.174.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.174.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.174.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.174.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.175.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.175.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.175.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.175.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.175.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.175.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.176.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.176.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.176.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.176.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.176.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.176.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.177.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.177.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.177.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.177.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.177.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.177.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.178.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.178.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.178.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.178.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.178.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.178.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.179.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.179.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.179.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.179.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.179.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.179.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.180.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.180.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.180.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.180.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.180.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.180.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.181.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.181.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.181.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.181.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.181.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.181.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.182.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.182.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.182.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.182.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.182.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.182.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.183.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.183.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.183.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.183.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.183.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.183.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.184.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.184.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.184.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.184.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.184.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.184.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.185.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.185.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.185.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.185.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.185.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.185.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.186.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.186.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.186.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.186.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.186.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.186.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.187.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.187.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.187.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.187.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.187.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.187.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.188.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.188.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.188.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.188.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.188.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.188.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.189.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.189.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.189.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.189.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.189.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.189.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.190.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.190.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.190.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.190.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.190.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.190.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.191.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.191.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.191.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.191.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.191.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.191.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.192.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.192.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.192.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.192.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.192.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.192.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.193.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.193.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.193.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.193.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.193.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.193.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.194.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.194.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.194.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.194.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.194.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.194.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.195.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.195.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.195.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.195.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.195.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.195.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.196.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.196.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.196.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.196.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.196.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.196.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.197.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.197.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.197.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.197.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.197.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.197.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.198.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.198.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.198.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.198.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.198.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.198.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.199.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.199.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.199.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.199.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.199.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.199.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.200.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.200.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.200.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.200.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.200.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.200.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.201.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.201.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.201.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.201.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.201.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.201.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.202.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.202.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.202.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.202.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.202.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.202.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.203.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.203.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.203.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.203.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.203.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.203.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.204.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.204.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.204.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.204.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.204.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.204.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.205.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.205.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.205.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.205.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.205.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.205.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.206.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.206.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.206.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.206.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.206.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.206.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.207.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.207.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.207.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.207.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.207.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.207.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.208.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.208.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.208.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.208.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.208.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.208.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.209.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.209.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.209.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.209.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.209.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.209.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.210.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.210.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.210.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.210.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.210.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.210.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.211.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.211.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.211.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.211.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.211.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.211.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.212.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.212.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.212.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.212.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.212.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.212.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.213.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.213.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.213.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.213.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.213.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.213.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.214.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.214.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.214.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.214.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.214.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.214.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.215.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.215.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.215.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.215.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.215.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.215.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.216.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.216.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.216.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.216.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.216.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.216.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.217.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.217.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.217.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.217.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.217.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.217.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.218.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.218.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.218.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.218.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.218.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.218.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.219.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.219.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.219.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.219.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.219.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.219.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.220.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.220.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.220.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.220.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.220.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.220.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.221.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.221.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.221.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.221.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.221.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.221.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.222.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.222.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.222.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.222.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.222.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.222.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.223.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.223.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.223.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.223.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.223.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.223.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.224.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.224.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.224.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.224.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.224.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.224.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.225.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.225.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.225.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.225.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.225.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.225.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.226.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.226.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.226.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.226.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.226.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.226.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.227.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.227.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.227.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.227.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.227.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.227.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.228.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.228.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.228.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.228.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.228.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.228.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.229.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.229.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.229.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.229.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.229.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.229.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.230.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.230.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.230.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.230.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.230.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.230.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.231.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.231.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.231.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.231.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.231.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.231.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.232.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.232.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.232.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.232.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.232.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.232.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.233.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.233.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.233.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.233.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.233.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.233.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.234.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.234.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.234.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.234.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.234.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.234.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.235.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.235.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.235.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.235.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.235.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.235.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.236.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.236.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.236.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.236.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.236.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.236.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.237.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.237.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.237.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.237.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.237.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.237.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.238.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.238.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.238.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.238.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.238.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.238.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.239.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.239.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.239.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.239.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.239.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.239.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.240.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.240.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.240.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.240.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.240.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.240.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.241.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.241.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.241.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.241.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.241.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.241.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.242.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.242.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.242.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.242.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.242.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.242.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.243.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.243.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.243.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.243.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.243.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.243.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.244.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.244.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.244.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.244.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.244.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.244.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.245.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.245.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.245.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.245.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.245.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.245.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.246.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.246.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.246.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.246.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.246.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.246.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.247.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.247.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.247.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.247.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.247.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.247.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.248.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.248.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.248.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.248.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.248.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.248.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.249.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.249.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.249.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.249.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.249.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.249.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.250.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.250.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.250.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.250.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.250.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.250.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.251.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.251.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.251.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.251.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.251.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.251.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.252.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.252.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.252.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.252.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.252.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.252.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.253.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.253.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.253.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.253.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.253.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.253.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.254.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.254.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.254.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.254.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.254.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.254.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.255.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.255.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.255.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.255.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.255.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.255.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.input_layernorm.weight": "model-00081-of-000163.safetensors", "model.layers.31.post_attention_layernorm.weight": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.q_a_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.self_attn.q_a_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.q_a_layernorm.weight": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.q_b_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.self_attn.q_b_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.kv_a_proj_with_mqa.weight": "model-00081-of-000163.safetensors", - "model.layers.32.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.kv_a_layernorm.weight": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.kv_b_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.self_attn.kv_b_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.o_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.self_attn.o_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.gate.weight": "model-00081-of-000163.safetensors", "model.layers.32.mlp.gate.e_score_correction_bias": "model-00081-of-000163.safetensors", "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.shared_experts.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.shared_experts.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.0.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.0.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.0.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.0.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.0.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.1.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.1.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.1.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.1.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.1.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.2.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.2.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.2.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.2.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.2.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.3.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.3.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.3.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.3.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.3.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.4.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.4.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.4.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.4.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.4.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.5.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.5.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.5.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.5.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.5.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.6.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.6.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.6.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.6.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.6.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.7.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.7.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.7.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.7.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.7.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.8.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.8.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.8.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.8.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.8.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.9.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.9.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.9.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.9.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.9.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.10.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.10.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.10.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.10.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.10.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.11.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.11.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.11.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.11.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.11.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.12.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.12.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.12.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.12.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.12.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.13.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.13.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.13.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.13.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.13.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.14.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.14.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.14.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.14.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.14.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.15.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.15.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.15.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.15.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.15.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.16.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.16.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.16.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.16.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.16.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.17.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.17.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.17.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.17.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.17.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.18.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.18.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.18.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.18.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.18.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.19.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.19.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.19.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.19.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.19.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.20.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.20.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.20.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.20.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.20.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.21.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.21.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.21.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.21.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.21.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.22.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.22.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.22.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.22.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.22.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.23.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.23.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.23.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.23.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.23.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.24.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.24.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.24.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.24.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.24.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.25.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.25.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.25.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.25.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.25.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.26.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.26.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.26.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.26.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.26.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.27.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.27.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.27.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.27.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.27.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.28.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.28.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.28.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.28.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.28.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.29.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.29.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.29.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.29.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.29.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.29.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.30.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.30.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.30.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.30.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.30.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.31.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.31.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.31.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.31.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.31.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.32.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.32.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.32.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.32.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.32.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.33.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.33.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.33.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.33.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.33.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.34.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.34.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.34.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.34.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.34.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.35.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.35.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.35.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.35.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.35.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.36.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.36.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.36.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.36.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.36.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.37.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.37.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.37.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.37.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.37.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.38.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.38.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.38.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.38.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.38.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.39.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.39.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.39.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.39.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.39.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.40.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.40.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.40.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.40.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.40.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.41.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.41.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.41.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.41.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.41.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.42.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.42.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.42.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.42.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.42.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.43.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.43.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.43.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.43.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.43.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.44.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.44.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.44.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.44.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.44.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.45.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.45.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.45.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.45.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.45.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.46.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.46.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.46.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.46.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.46.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.47.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.47.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.47.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.47.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.47.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.48.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.48.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.48.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.48.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.48.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.49.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.49.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.49.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.49.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.49.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.50.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.50.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.50.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.50.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.50.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.50.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.51.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.51.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.51.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.51.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.51.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.52.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.52.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.52.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.52.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.52.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.53.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.53.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.53.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.53.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.53.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.54.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.54.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.54.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.54.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.54.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.55.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.55.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.55.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.55.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.55.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.56.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.56.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.56.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.56.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.56.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.57.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.57.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.57.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.57.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.57.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.58.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.58.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.58.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.58.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.58.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.59.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.59.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.59.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.59.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.59.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.60.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.60.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.60.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.60.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.60.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.61.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.61.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.61.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.61.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.61.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.62.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.62.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.62.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.62.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.62.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.63.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.63.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.63.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.63.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.63.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.64.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.64.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.64.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.64.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.64.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.65.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.65.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.65.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.65.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.65.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.66.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.66.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.66.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.66.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.66.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.67.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.67.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.67.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.67.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.67.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.68.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.68.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.68.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.68.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.68.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.69.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.69.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.69.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.69.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.69.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.70.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.70.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.70.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.70.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.70.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.71.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.71.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.71.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.71.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.71.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.72.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.72.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.72.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.72.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.72.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.72.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.73.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.73.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.73.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.73.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.73.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.74.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.74.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.74.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.74.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.74.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.75.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.75.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.75.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.75.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.75.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.76.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.76.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.76.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.76.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.76.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.77.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.77.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.77.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.77.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.77.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.78.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.78.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.78.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.78.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.78.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.78.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.79.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.79.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.79.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.79.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.79.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.80.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.80.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.80.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.80.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.80.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.81.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.81.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.81.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.81.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.81.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.82.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.82.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.82.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.82.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.82.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.83.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.83.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.83.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.83.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.83.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.84.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.84.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.84.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.84.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.84.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.85.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.85.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.85.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.85.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.85.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.86.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.86.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.86.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.86.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.86.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.87.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.87.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.87.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.87.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.87.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.88.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.88.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.88.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.88.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.88.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.89.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.89.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.89.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.89.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.89.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.90.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.90.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.90.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.90.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.90.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.91.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.91.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.91.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.91.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.91.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.92.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.92.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.92.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.92.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.92.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.93.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.93.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.93.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.93.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.93.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.94.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.94.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.94.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.94.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.94.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.94.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.95.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.95.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.95.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.95.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.95.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.96.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.96.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.96.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.96.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.96.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.97.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.97.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.97.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.97.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.97.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.98.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.98.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.98.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.98.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.98.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.99.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.99.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.99.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.99.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.99.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.100.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.100.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.100.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.100.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.100.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.101.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.101.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.101.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.101.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.101.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.102.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.102.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.102.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.102.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.102.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.103.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.103.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.103.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.103.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.103.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.104.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.104.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.104.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.104.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.104.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.105.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.105.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.105.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.105.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.105.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.106.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.106.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.106.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.106.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.106.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.107.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.107.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.107.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.107.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.107.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.108.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.108.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.108.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.108.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.108.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.109.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.109.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.109.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.109.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.109.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.110.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.110.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.110.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.110.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.110.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.111.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.111.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.111.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.111.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.111.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.112.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.112.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.112.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.112.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.112.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.113.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.113.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.113.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.113.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.113.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.113.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.114.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.114.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.114.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.114.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.114.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.115.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.115.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.115.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.115.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.115.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.116.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.116.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.116.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.116.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.116.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.117.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.117.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.117.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.117.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.117.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.117.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.118.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.118.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.118.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.118.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.118.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.119.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.119.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.119.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.119.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.119.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.120.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.120.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.120.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.120.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.120.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.121.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.121.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.121.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.121.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.121.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.122.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.122.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.122.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.122.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.122.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.123.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.123.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.123.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.123.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.123.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.124.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.124.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.124.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.124.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.124.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.125.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.125.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.125.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.125.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.125.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.126.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.126.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.126.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.126.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.126.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.127.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.127.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.127.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.127.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.127.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.128.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.128.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.128.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.128.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.128.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.128.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.129.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.129.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.129.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.129.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.129.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.129.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.130.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.130.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.130.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.130.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.130.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.130.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.131.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.131.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.131.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.131.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.131.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.131.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.132.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.132.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.132.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.132.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.132.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.132.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.133.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.133.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.133.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.133.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.133.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.133.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.134.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.134.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.134.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.134.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.134.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.134.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.135.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.135.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.135.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.135.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.135.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.135.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.136.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.136.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.136.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.136.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.136.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.136.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.137.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.137.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.137.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.137.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.137.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.137.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.138.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.138.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.138.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.138.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.138.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.138.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.139.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.139.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.139.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.139.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.139.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.139.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.140.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.140.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.140.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.140.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.140.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.140.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.141.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.141.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.141.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.141.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.141.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.141.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.142.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.142.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.142.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.142.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.142.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.142.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.143.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.143.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.143.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.143.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.143.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.143.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.144.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.144.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.144.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.144.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.144.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.144.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.145.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.145.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.145.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.145.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.145.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.145.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.146.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.146.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.146.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.146.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.146.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.146.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.147.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.147.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.147.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.147.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.147.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.147.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.148.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.148.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.148.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.148.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.148.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.148.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.149.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.149.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.149.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.149.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.149.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.149.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.150.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.150.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.150.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.150.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.150.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.150.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.151.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.151.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.151.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.151.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.151.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.151.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.152.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.152.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.152.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.152.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.152.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.152.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.153.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.153.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.153.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.153.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.153.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.153.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.154.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.154.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.154.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.154.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.154.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.154.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.155.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.155.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.155.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.155.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.155.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.155.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.156.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.156.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.156.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.156.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.156.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.156.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.157.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.157.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.157.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.157.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.157.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.157.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.158.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.158.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.158.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.158.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.158.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.158.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.159.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.159.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.159.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.159.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.159.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.159.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.160.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.160.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.160.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.160.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.160.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.160.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.161.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.161.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.161.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.161.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.161.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.161.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.162.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.162.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.162.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.162.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.162.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.162.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.163.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.163.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.163.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.163.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.163.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.163.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.164.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.164.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.164.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.164.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.164.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.164.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.165.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.165.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.165.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.165.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.165.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.165.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.166.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.166.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.166.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.166.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.166.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.166.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.167.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.167.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.167.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.167.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.167.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.167.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.168.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.168.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.168.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.168.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.168.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.168.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.169.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.169.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.169.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.169.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.169.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.169.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.170.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.170.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.170.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.170.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.170.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.170.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.171.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.171.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.171.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.171.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.171.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.171.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.172.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.172.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.172.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.172.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.172.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.172.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.173.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.173.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.173.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.173.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.173.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.173.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.174.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.174.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.174.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.174.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.174.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.174.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.175.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.175.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.175.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.175.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.175.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.175.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.176.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.176.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.176.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.176.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.176.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.176.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.177.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.177.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.177.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.177.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.177.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.177.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.178.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.178.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.178.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.178.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.178.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.178.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.179.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.179.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.179.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.179.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.179.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.179.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.180.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.180.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.180.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.180.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.180.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.180.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.181.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.181.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.181.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.181.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.181.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.181.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.182.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.182.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.182.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.182.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.182.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.182.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.183.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.183.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.183.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.183.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.183.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.183.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.184.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.184.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.184.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.184.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.184.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.184.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.185.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.185.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.185.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.185.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.185.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.185.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.186.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.186.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.186.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.186.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.186.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.186.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.187.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.187.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.187.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.187.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.187.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.187.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.188.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.188.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.188.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.188.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.188.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.188.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.189.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.189.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.189.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.189.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.189.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.189.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.190.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.190.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.190.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.190.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.190.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.190.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.191.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.191.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.191.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.191.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.191.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.191.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.192.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.192.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.192.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.192.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.192.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.192.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.193.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.193.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.193.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.193.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.193.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.193.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.194.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.194.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.194.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.194.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.194.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.194.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.195.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.195.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.195.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.195.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.195.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.195.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.196.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.196.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.196.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.196.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.196.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.196.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.197.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.197.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.197.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.197.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.197.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.197.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.198.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.198.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.198.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.198.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.198.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.198.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.199.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.199.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.199.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.199.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.199.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.199.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.200.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.200.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.200.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.200.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.200.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.200.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.201.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.201.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.201.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.201.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.201.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.201.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.202.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.202.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.202.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.202.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.202.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.202.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.203.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.203.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.203.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.203.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.203.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.203.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.204.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.204.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.204.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.204.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.204.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.204.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.205.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.205.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.205.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.205.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.205.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.205.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.206.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.206.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.206.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.206.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.206.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.206.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.207.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.207.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.207.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.207.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.207.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.207.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.208.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.208.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.208.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.208.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.208.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.208.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.209.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.209.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.209.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.209.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.209.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.209.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.210.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.210.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.210.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.210.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.210.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.210.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.211.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.211.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.211.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.211.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.211.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.211.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.212.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.212.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.212.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.212.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.212.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.212.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.213.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.213.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.213.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.213.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.213.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.213.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.214.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.214.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.214.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.214.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.214.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.214.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.215.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.215.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.215.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.215.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.215.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.215.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.216.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.216.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.216.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.216.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.216.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.216.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.217.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.217.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.217.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.217.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.217.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.217.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.218.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.218.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.218.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.218.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.218.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.218.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.219.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.219.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.219.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.219.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.219.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.219.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.220.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.220.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.220.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.220.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.220.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.220.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.221.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.221.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.221.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.221.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.221.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.221.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.222.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.222.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.222.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.222.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.222.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.222.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.223.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.223.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.223.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.223.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.223.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.223.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.224.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.224.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.224.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.224.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.224.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.224.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.225.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.225.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.225.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.225.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.225.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.225.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.226.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.226.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.226.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.226.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.226.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.226.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.227.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.227.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.227.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.227.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.227.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.227.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.228.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.228.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.228.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.228.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.228.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.228.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.229.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.229.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.229.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.229.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.229.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.229.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.230.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.230.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.230.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.230.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.230.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.230.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.231.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.231.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.231.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.231.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.231.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.231.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.232.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.232.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.232.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.232.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.232.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.232.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.233.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.233.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.233.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.233.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.233.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.233.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.234.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.234.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.234.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.234.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.234.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.234.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.235.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.235.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.235.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.235.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.235.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.235.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.236.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.236.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.236.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.236.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.236.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.236.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.237.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.237.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.237.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.237.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.237.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.237.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.238.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.238.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.238.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.238.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.238.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.238.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.239.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.239.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.239.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.239.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.239.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.239.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.240.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.240.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.240.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.240.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.240.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.240.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.241.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.241.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.241.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.241.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.241.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.241.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.242.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.242.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.242.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.242.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.242.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.242.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.243.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.243.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.243.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.243.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.243.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.243.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.244.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.244.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.244.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.244.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.244.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.244.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.245.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.245.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.245.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.245.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.245.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.245.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.246.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.246.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.246.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.246.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.246.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.246.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.247.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.247.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.247.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.247.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.247.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.247.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.248.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.248.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.248.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.248.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.248.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.248.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.249.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.249.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.249.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.249.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.249.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.249.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.250.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.250.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.250.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.250.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.250.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.250.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.251.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.251.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.251.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.251.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.251.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.251.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.252.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.252.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.252.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.252.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.252.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.252.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.253.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.253.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.253.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.253.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.253.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.253.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.254.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.254.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.254.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.254.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.254.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.254.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.255.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.255.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.255.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.255.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.255.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.255.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.input_layernorm.weight": "model-00084-of-000163.safetensors", "model.layers.32.post_attention_layernorm.weight": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.q_a_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.self_attn.q_a_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.q_a_layernorm.weight": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.q_b_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.self_attn.q_b_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.kv_a_proj_with_mqa.weight": "model-00084-of-000163.safetensors", - "model.layers.33.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.kv_a_layernorm.weight": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.kv_b_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.self_attn.kv_b_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.o_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.self_attn.o_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.gate.weight": "model-00084-of-000163.safetensors", "model.layers.33.mlp.gate.e_score_correction_bias": "model-00084-of-000163.safetensors", "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.shared_experts.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.shared_experts.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.0.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.0.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.0.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.0.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.0.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.1.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.1.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.1.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.1.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.1.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.2.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.2.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.2.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.2.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.2.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.3.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.3.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.3.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.3.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.3.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.4.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.4.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.4.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.4.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.4.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.5.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.5.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.5.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.5.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.5.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.6.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.6.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.6.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.6.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.6.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.7.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.7.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.7.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.7.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.7.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.8.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.8.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.8.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.8.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.8.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.9.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.9.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.9.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.9.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.9.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.10.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.10.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.10.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.10.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.10.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.11.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.11.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.11.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.11.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.11.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.12.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.12.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.12.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.12.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.12.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.13.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.13.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.13.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.13.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.13.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.14.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.14.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.14.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.14.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.14.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.15.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.15.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.15.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.15.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.15.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.16.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.16.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.16.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.16.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.16.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.17.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.17.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.17.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.17.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.17.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.18.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.18.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.18.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.18.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.18.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.19.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.19.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.19.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.19.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.19.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.20.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.20.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.20.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.20.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.20.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.21.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.21.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.21.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.21.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.21.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.22.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.22.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.22.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.22.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.22.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.23.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.23.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.23.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.23.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.23.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.24.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.24.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.24.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.24.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.24.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.25.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.25.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.25.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.25.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.25.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.26.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.26.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.26.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.26.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.26.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.27.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.27.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.27.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.27.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.27.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.28.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.28.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.28.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.28.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.28.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.29.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.29.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.29.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.29.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.29.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.30.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.30.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.30.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.30.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.30.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.31.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.31.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.31.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.31.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.31.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.32.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.32.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.32.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.32.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.32.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.33.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.33.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.33.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.33.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.33.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.34.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.34.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.34.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.34.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.34.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.35.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.35.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.35.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.35.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.35.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.36.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.36.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.36.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.36.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.36.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.37.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.37.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.37.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.37.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.37.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.38.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.38.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.38.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.38.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.38.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.39.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.39.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.39.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.39.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.39.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.40.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.40.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.40.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.40.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.40.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.41.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.41.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.41.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.41.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.41.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.42.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.42.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.42.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.42.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.42.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.43.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.43.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.43.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.43.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.43.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.44.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.44.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.44.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.44.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.44.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.45.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.45.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.45.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.45.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.45.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.46.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.46.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.46.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.46.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.46.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.47.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.47.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.47.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.47.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.47.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.48.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.48.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.48.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.48.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.48.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.49.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.49.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.49.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.49.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.49.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.50.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.50.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.50.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.50.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.50.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.51.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.51.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.51.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.51.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.51.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.52.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.52.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.52.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.52.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.52.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.53.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.53.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.53.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.53.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.53.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.54.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.54.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.54.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.54.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.54.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.55.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.55.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.55.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.55.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.55.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.56.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.56.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.56.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.56.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.56.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.57.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.57.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.57.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.57.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.57.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.58.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.58.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.58.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.58.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.58.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.59.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.59.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.59.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.59.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.59.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.60.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.60.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.60.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.60.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.60.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.61.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.61.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.61.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.61.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.61.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.62.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.62.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.62.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.62.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.62.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.63.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.63.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.63.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.63.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.63.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.64.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.64.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.64.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.64.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.64.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.65.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.65.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.65.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.65.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.65.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.66.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.66.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.66.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.66.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.66.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.67.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.67.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.67.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.67.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.67.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.68.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.68.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.68.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.68.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.68.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.69.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.69.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.69.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.69.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.69.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.70.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.70.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.70.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.70.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.70.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.71.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.71.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.71.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.71.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.71.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.72.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.72.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.72.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.72.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.72.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.73.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.73.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.73.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.73.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.73.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.74.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.74.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.74.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.74.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.74.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.75.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.75.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.75.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.75.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.75.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.76.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.76.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.76.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.76.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.76.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.77.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.77.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.77.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.77.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.77.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.78.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.78.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.78.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.78.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.78.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.79.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.79.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.79.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.79.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.79.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.80.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.80.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.80.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.80.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.80.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.81.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.81.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.81.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.81.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.81.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.82.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.82.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.82.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.82.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.82.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.83.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.83.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.83.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.83.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.83.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.84.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.84.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.84.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.84.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.84.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.85.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.85.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.85.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.85.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.85.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.86.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.86.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.86.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.86.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.86.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.87.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.87.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.87.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.87.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.87.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.88.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.88.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.88.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.88.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.88.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.89.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.89.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.89.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.89.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.89.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.90.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.90.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.90.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.90.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.90.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.91.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.91.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.91.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.91.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.91.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.92.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.92.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.92.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.92.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.92.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.93.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.93.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.93.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.93.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.93.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.94.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.94.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.94.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.94.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.94.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.95.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.95.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.95.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.95.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.95.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.96.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.96.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.96.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.96.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.96.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.97.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.97.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.97.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.97.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.97.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.98.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.98.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.98.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.98.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.98.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.99.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.99.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.99.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.99.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.99.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.100.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.100.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.100.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.100.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.100.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.101.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.101.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.101.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.101.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.101.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.102.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.102.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.102.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.102.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.102.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.103.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.103.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.103.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.103.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.103.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.104.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.104.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.104.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.104.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.104.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.105.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.105.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.105.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.105.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.105.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.106.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.106.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.106.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.106.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.106.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.107.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.107.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.107.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.107.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.107.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.108.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.108.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.108.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.108.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.108.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.109.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.109.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.109.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.109.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.109.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.110.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.110.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.110.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.110.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.110.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.111.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.111.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.111.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.111.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.111.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.112.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.112.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.112.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.112.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.112.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.113.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.113.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.113.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.113.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.113.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.114.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.114.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.114.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.114.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.114.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.115.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.115.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.115.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.115.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.115.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.115.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.116.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.116.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.116.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.116.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.116.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.117.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.117.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.117.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.117.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.117.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.118.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.118.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.118.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.118.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.118.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.119.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.119.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.119.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.119.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.119.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.120.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.120.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.120.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.120.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.120.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.121.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.121.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.121.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.121.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.121.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.122.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.122.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.122.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.122.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.122.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.123.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.123.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.123.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.123.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.123.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.124.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.124.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.124.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.124.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.124.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.125.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.125.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.125.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.125.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.125.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.126.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.126.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.126.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.126.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.126.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.127.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.127.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.127.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.127.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.127.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.128.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.128.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.128.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.128.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.128.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.128.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.129.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.129.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.129.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.129.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.129.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.129.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.130.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.130.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.130.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.130.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.130.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.130.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.131.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.131.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.131.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.131.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.131.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.131.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.132.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.132.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.132.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.132.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.132.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.132.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.133.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.133.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.133.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.133.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.133.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.133.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.134.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.134.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.134.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.134.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.134.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.134.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.135.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.135.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.135.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.135.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.135.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.135.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.136.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.136.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.136.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.136.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.136.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.136.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.137.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.137.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.137.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.137.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.137.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.137.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.138.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.138.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.138.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.138.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.138.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.138.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.139.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.139.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.139.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.139.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.139.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.139.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.140.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.140.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.140.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.140.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.140.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.140.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.141.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.141.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.141.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.141.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.141.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.141.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.142.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.142.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.142.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.142.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.142.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.142.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.143.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.143.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.143.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.143.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.143.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.143.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.144.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.144.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.144.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.144.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.144.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.144.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.145.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.145.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.145.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.145.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.145.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.145.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.146.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.146.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.146.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.146.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.146.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.146.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.147.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.147.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.147.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.147.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.147.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.147.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.148.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.148.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.148.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.148.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.148.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.148.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.149.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.149.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.149.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.149.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.149.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.149.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.150.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.150.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.150.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.150.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.150.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.150.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.151.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.151.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.151.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.151.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.151.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.151.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.152.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.152.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.152.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.152.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.152.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.152.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.153.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.153.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.153.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.153.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.153.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.153.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.154.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.154.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.154.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.154.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.154.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.154.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.155.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.155.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.155.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.155.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.155.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.155.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.156.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.156.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.156.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.156.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.156.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.156.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.157.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.157.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.157.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.157.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.157.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.157.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.158.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.158.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.158.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.158.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.158.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.158.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.159.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.159.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.159.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.159.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.159.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.159.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.160.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.160.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.160.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.160.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.160.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.160.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.161.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.161.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.161.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.161.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.161.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.161.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.162.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.162.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.162.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.162.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.162.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.162.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.163.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.163.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.163.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.163.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.163.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.163.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.164.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.164.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.164.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.164.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.164.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.164.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.165.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.165.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.165.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.165.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.165.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.165.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.166.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.166.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.166.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.166.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.166.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.166.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.167.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.167.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.167.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.167.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.167.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.167.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.168.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.168.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.168.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.168.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.168.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.168.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.169.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.169.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.169.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.169.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.169.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.169.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.170.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.170.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.170.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.170.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.170.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.170.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.171.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.171.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.171.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.171.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.171.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.171.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.172.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.172.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.172.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.172.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.172.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.172.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.173.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.173.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.173.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.173.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.173.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.173.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.174.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.174.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.174.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.174.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.174.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.174.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.175.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.175.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.175.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.175.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.175.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.175.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.176.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.176.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.176.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.176.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.176.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.176.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.177.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.177.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.177.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.177.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.177.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.177.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.178.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.178.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.178.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.178.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.178.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.178.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.179.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.179.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.179.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.179.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.179.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.179.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.180.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.180.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.180.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.180.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.180.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.180.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.181.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.181.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.181.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.181.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.181.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.181.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.182.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.182.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.182.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.182.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.182.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.182.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.183.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.183.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.183.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.183.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.183.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.183.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.184.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.184.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.184.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.184.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.184.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.184.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.185.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.185.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.185.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.185.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.185.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.185.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.186.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.186.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.186.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.186.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.186.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.186.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.187.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.187.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.187.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.187.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.187.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.187.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.188.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.188.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.188.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.188.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.188.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.188.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.189.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.189.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.189.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.189.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.189.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.189.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.190.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.190.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.190.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.190.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.190.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.190.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.191.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.191.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.191.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.191.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.191.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.191.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.192.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.192.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.192.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.192.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.192.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.192.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.193.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.193.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.193.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.193.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.193.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.193.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.194.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.194.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.194.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.194.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.194.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.194.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.195.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.195.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.195.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.195.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.195.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.195.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.196.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.196.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.196.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.196.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.196.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.196.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.197.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.197.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.197.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.197.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.197.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.197.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.198.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.198.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.198.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.198.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.198.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.198.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.199.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.199.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.199.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.199.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.199.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.199.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.200.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.200.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.200.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.200.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.200.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.200.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.201.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.201.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.201.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.201.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.201.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.201.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.202.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.202.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.202.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.202.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.202.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.202.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.203.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.203.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.203.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.203.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.203.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.203.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.204.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.204.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.204.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.204.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.204.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.204.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.205.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.205.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.205.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.205.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.205.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.205.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.206.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.206.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.206.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.206.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.206.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.206.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.207.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.207.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.207.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.207.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.207.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.207.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.208.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.208.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.208.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.208.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.208.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.208.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.209.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.209.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.209.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.209.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.209.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.209.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.210.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.210.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.210.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.210.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.210.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.210.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.211.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.211.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.211.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.211.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.211.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.211.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.212.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.212.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.212.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.212.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.212.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.212.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.213.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.213.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.213.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.213.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.213.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.213.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.214.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.214.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.214.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.214.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.214.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.214.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.215.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.215.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.215.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.215.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.215.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.215.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.216.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.216.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.216.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.216.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.216.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.216.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.217.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.217.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.217.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.217.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.217.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.217.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.218.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.218.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.218.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.218.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.218.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.218.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.219.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.219.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.219.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.219.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.219.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.219.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.220.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.220.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.220.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.220.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.220.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.220.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.221.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.221.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.221.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.221.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.221.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.221.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.222.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.222.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.222.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.222.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.222.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.222.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.223.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.223.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.223.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.223.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.223.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.223.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.224.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.224.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.224.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.224.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.224.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.224.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.225.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.225.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.225.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.225.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.225.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.225.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.226.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.226.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.226.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.226.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.226.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.226.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.227.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.227.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.227.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.227.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.227.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.227.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.228.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.228.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.228.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.228.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.228.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.228.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.229.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.229.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.229.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.229.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.229.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.229.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.230.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.230.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.230.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.230.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.230.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.230.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.231.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.231.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.231.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.231.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.231.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.231.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.232.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.232.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.232.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.232.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.232.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.232.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.233.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.233.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.233.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.233.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.233.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.233.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.234.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.234.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.234.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.234.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.234.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.234.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.235.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.235.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.235.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.235.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.235.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.235.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.236.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.236.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.236.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.236.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.236.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.236.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.237.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.237.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.237.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.237.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.237.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.237.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.238.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.238.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.238.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.238.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.238.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.238.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.239.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.239.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.239.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.239.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.239.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.239.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.240.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.240.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.240.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.240.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.240.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.240.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.241.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.241.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.241.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.241.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.241.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.241.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.242.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.242.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.242.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.242.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.242.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.242.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.243.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.243.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.243.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.243.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.243.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.243.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.244.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.244.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.244.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.244.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.244.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.244.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.245.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.245.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.245.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.245.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.245.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.245.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.246.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.246.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.246.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.246.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.246.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.246.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.247.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.247.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.247.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.247.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.247.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.247.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.248.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.248.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.248.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.248.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.248.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.248.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.249.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.249.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.249.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.249.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.249.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.249.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.250.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.250.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.250.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.250.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.250.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.250.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.251.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.251.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.251.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.251.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.251.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.251.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.252.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.252.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.252.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.252.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.252.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.252.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.253.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.253.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.253.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.253.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.253.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.253.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.254.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.254.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.254.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.254.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.254.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.254.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.255.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.255.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.255.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.255.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.255.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.255.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.input_layernorm.weight": "model-00087-of-000163.safetensors", "model.layers.33.post_attention_layernorm.weight": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.q_a_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.self_attn.q_a_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.q_a_layernorm.weight": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.q_b_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.self_attn.q_b_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.kv_a_proj_with_mqa.weight": "model-00087-of-000163.safetensors", - "model.layers.34.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.kv_a_layernorm.weight": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.kv_b_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.self_attn.kv_b_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.o_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.self_attn.o_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.gate.weight": "model-00087-of-000163.safetensors", "model.layers.34.mlp.gate.e_score_correction_bias": "model-00087-of-000163.safetensors", "model.layers.34.mlp.shared_experts.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.shared_experts.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.shared_experts.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.0.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.0.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.0.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.0.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.0.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.1.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.1.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.1.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.1.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.1.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.2.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.2.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.2.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.2.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.2.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.3.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.3.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.3.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.3.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.3.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.4.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.4.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.4.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.4.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.4.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.5.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.5.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.5.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.5.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.5.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.6.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.6.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.6.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.6.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.6.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.7.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.7.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.7.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.7.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.7.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.8.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.8.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.8.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.8.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.8.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.9.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.9.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.9.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.9.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.9.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.10.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.10.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.10.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.10.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.10.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.11.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.11.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.11.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.11.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.11.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.12.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.12.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.12.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.12.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.12.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.13.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.13.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.13.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.13.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.13.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.14.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.14.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.14.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.14.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.14.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.15.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.15.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.15.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.15.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.15.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.16.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.16.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.16.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.16.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.16.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.17.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.17.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.17.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.17.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.17.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.18.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.18.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.18.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.18.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.18.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.19.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.19.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.19.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.19.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.19.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.20.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.20.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.20.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.20.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.20.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.21.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.21.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.21.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.21.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.21.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.22.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.22.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.22.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.22.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.22.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.23.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.23.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.23.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.23.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.23.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.24.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.24.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.24.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.24.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.24.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.25.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.25.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.25.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.25.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.25.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.26.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.26.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.26.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.26.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.26.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.27.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.27.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.27.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.27.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.27.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.28.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.28.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.28.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.28.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.28.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.29.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.29.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.29.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.29.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.29.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.30.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.30.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.30.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.30.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.30.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.31.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.31.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.31.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.31.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.31.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.32.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.32.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.32.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.32.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.32.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.33.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.33.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.33.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.33.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.33.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.34.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.34.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.34.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.34.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.34.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.35.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.35.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.35.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.35.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.35.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.36.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.36.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.36.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.36.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.36.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.37.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.37.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.37.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.37.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.37.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.38.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.38.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.38.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.38.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.38.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.39.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.39.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.39.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.39.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.39.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.40.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.40.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.40.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.40.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.40.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.41.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.41.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.41.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.41.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.41.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.42.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.42.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.42.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.42.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.42.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.43.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.43.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.43.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.43.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.43.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.44.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.44.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.44.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.44.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.44.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.45.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.45.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.45.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.45.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.45.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.46.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.46.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.46.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.46.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.46.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.47.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.47.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.47.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.47.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.47.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.48.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.48.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.48.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.48.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.48.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.49.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.49.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.49.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.49.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.49.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.50.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.50.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.50.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.50.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.50.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.51.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.51.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.51.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.51.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.51.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.52.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.52.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.52.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.52.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.52.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.53.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.53.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.53.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.53.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.53.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.54.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.54.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.54.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.54.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.54.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.55.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.55.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.55.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.55.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.55.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.56.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.56.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.56.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.56.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.56.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.57.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.57.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.57.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.57.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.57.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.58.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.58.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.58.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.58.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.58.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.59.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.59.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.59.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.59.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.59.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.60.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.60.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.60.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.60.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.60.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.61.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.61.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.61.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.61.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.61.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.62.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.62.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.62.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.62.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.62.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.63.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.63.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.63.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.63.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.63.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.64.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.64.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.64.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.64.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.64.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.65.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.65.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.65.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.65.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.65.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.66.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.66.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.66.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.66.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.66.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.67.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.67.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.67.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.67.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.67.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.68.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.68.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.68.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.68.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.68.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.69.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.69.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.69.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.69.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.69.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.70.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.70.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.70.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.70.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.70.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.71.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.71.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.71.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.71.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.71.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.72.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.72.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.72.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.72.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.72.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.73.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.73.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.73.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.73.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.73.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.74.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.74.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.74.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.74.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.74.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.75.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.75.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.75.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.75.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.75.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.76.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.76.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.76.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.76.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.76.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.77.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.77.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.77.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.77.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.77.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.78.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.78.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.78.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.78.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.78.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.79.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.79.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.79.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.79.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.79.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.80.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.80.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.80.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.80.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.80.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.81.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.81.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.81.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.81.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.81.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.82.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.82.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.82.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.82.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.82.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.83.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.83.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.83.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.83.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.83.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.84.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.84.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.84.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.84.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.84.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.85.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.85.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.85.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.85.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.85.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.86.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.86.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.86.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.86.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.86.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.87.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.87.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.87.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.87.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.87.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.88.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.88.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.88.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.88.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.88.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.89.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.89.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.89.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.89.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.89.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.90.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.90.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.90.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.90.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.90.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.91.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.91.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.91.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.91.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.91.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.92.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.92.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.92.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.92.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.92.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.93.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.93.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.93.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.93.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.93.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.94.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.94.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.94.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.94.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.94.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.95.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.95.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.95.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.95.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.95.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.96.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.96.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.96.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.96.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.96.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.97.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.97.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.97.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.97.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.97.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.98.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.98.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.98.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.98.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.98.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.99.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.99.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.99.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.99.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.99.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.100.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.100.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.100.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.100.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.100.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.101.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.101.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.101.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.101.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.101.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.102.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.102.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.102.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.102.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.102.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.103.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.103.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.103.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.103.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.103.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.104.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.104.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.104.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.104.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.104.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.105.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.105.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.105.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.105.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.105.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.106.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.106.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.106.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.106.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.106.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.107.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.107.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.107.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.107.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.107.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.108.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.108.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.108.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.108.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.108.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.109.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.109.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.109.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.109.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.109.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.110.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.110.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.110.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.110.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.110.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.111.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.111.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.111.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.111.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.111.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.111.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.112.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.112.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.112.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.112.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.112.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.113.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.113.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.113.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.113.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.113.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.114.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.114.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.114.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.114.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.114.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.115.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.115.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.115.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.115.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.115.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.116.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.116.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.116.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.116.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.116.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.117.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.117.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.117.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.117.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.117.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.118.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.118.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.118.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.118.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.118.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.119.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.119.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.119.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.119.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.119.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.120.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.120.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.120.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.120.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.120.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.121.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.121.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.121.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.121.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.121.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.122.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.122.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.122.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.122.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.122.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.123.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.123.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.123.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.123.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.123.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.124.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.124.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.124.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.124.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.124.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.125.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.125.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.125.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.125.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.125.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.126.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.126.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.126.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.126.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.126.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.127.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.127.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.127.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.127.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.127.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.128.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.128.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.128.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.128.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.128.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.128.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.129.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.129.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.129.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.129.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.129.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.129.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.130.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.130.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.130.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.130.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.130.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.130.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.131.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.131.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.131.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.131.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.131.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.131.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.132.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.132.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.132.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.132.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.132.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.132.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.133.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.133.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.133.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.133.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.133.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.133.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.134.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.134.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.134.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.134.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.134.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.134.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.135.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.135.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.135.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.135.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.135.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.135.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.136.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.136.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.136.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.136.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.136.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.136.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.137.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.137.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.137.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.137.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.137.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.137.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.138.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.138.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.138.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.138.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.138.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.138.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.139.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.139.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.139.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.139.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.139.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.139.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.140.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.140.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.140.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.140.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.140.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.140.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.141.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.141.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.141.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.141.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.141.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.141.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.142.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.142.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.142.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.142.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.142.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.142.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.143.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.143.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.143.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.143.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.143.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.143.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.144.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.144.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.144.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.144.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.144.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.144.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.145.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.145.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.145.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.145.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.145.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.145.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.146.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.146.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.146.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.146.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.146.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.146.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.147.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.147.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.147.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.147.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.147.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.147.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.148.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.148.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.148.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.148.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.148.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.148.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.149.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.149.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.149.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.149.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.149.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.149.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.150.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.150.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.150.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.150.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.150.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.150.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.151.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.151.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.151.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.151.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.151.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.151.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.152.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.152.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.152.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.152.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.152.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.152.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.153.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.153.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.153.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.153.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.153.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.153.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.154.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.154.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.154.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.154.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.154.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.154.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.155.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.155.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.155.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.155.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.155.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.155.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.156.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.156.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.156.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.156.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.156.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.156.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.157.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.157.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.157.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.157.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.157.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.157.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.158.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.158.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.158.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.158.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.158.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.158.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.159.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.159.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.159.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.159.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.159.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.159.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.160.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.160.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.160.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.160.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.160.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.160.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.161.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.161.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.161.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.161.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.161.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.161.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.162.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.162.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.162.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.162.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.162.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.162.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.163.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.163.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.163.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.163.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.163.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.163.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.164.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.164.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.164.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.164.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.164.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.164.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.165.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.165.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.165.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.165.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.165.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.165.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.166.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.166.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.166.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.166.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.166.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.166.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.167.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.167.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.167.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.167.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.167.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.167.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.168.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.168.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.168.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.168.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.168.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.168.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.169.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.169.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.169.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.169.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.169.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.169.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.170.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.170.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.170.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.170.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.170.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.170.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.171.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.171.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.171.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.171.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.171.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.171.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.172.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.172.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.172.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.172.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.172.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.172.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.173.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.173.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.173.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.173.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.173.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.173.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.174.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.174.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.174.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.174.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.174.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.174.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.175.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.175.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.175.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.175.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.175.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.175.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.176.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.176.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.176.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.176.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.176.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.176.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.177.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.177.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.177.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.177.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.177.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.177.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.178.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.178.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.178.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.178.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.178.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.178.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.179.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.179.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.179.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.179.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.179.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.179.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.180.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.180.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.180.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.180.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.180.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.180.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.181.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.181.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.181.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.181.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.181.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.181.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.182.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.182.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.182.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.182.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.182.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.182.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.183.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.183.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.183.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.183.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.183.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.183.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.184.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.184.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.184.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.184.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.184.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.184.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.185.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.185.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.185.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.185.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.185.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.185.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.186.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.186.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.186.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.186.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.186.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.186.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.187.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.187.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.187.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.187.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.187.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.187.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.188.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.188.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.188.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.188.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.188.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.188.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.189.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.189.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.189.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.189.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.189.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.189.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.190.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.190.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.190.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.190.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.190.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.190.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.191.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.191.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.191.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.191.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.191.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.191.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.192.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.192.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.192.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.192.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.192.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.192.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.193.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.193.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.193.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.193.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.193.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.193.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.194.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.194.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.194.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.194.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.194.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.194.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.195.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.195.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.195.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.195.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.195.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.195.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.196.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.196.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.196.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.196.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.196.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.196.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.197.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.197.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.197.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.197.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.197.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.197.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.198.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.198.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.198.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.198.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.198.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.198.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.199.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.199.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.199.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.199.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.199.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.199.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.200.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.200.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.200.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.200.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.200.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.200.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.201.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.201.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.201.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.201.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.201.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.201.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.202.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.202.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.202.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.202.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.202.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.202.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.203.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.203.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.203.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.203.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.203.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.203.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.204.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.204.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.204.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.204.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.204.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.204.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.205.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.205.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.205.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.205.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.205.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.205.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.206.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.206.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.206.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.206.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.206.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.206.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.207.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.207.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.207.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.207.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.207.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.207.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.208.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.208.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.208.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.208.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.208.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.208.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.209.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.209.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.209.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.209.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.209.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.209.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.210.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.210.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.210.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.210.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.210.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.210.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.211.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.211.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.211.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.211.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.211.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.211.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.212.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.212.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.212.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.212.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.212.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.212.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.213.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.213.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.213.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.213.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.213.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.213.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.214.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.214.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.214.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.214.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.214.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.214.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.215.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.215.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.215.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.215.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.215.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.215.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.216.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.216.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.216.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.216.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.216.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.216.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.217.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.217.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.217.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.217.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.217.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.217.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.218.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.218.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.218.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.218.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.218.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.218.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.219.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.219.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.219.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.219.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.219.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.219.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.220.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.220.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.220.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.220.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.220.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.220.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.221.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.221.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.221.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.221.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.221.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.221.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.222.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.222.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.222.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.222.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.222.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.222.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.223.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.223.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.223.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.223.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.223.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.223.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.224.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.224.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.224.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.224.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.224.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.224.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.225.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.225.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.225.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.225.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.225.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.225.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.226.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.226.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.226.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.226.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.226.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.226.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.227.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.227.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.227.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.227.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.227.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.227.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.228.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.228.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.228.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.228.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.228.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.228.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.229.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.229.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.229.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.229.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.229.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.229.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.230.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.230.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.230.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.230.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.230.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.230.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.231.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.231.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.231.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.231.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.231.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.231.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.232.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.232.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.232.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.232.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.232.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.232.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.233.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.233.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.233.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.233.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.233.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.233.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.234.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.234.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.234.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.234.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.234.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.234.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.235.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.235.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.235.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.235.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.235.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.235.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.236.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.236.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.236.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.236.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.236.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.236.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.237.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.237.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.237.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.237.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.237.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.237.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.238.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.238.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.238.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.238.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.238.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.238.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.239.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.239.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.239.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.239.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.239.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.239.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.240.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.240.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.240.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.240.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.240.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.240.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.241.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.241.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.241.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.241.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.241.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.241.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.242.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.242.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.242.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.242.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.242.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.242.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.243.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.243.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.243.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.243.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.243.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.243.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.244.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.244.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.244.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.244.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.244.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.244.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.245.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.245.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.245.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.245.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.245.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.245.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.246.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.246.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.246.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.246.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.246.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.246.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.247.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.247.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.247.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.247.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.247.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.247.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.248.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.248.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.248.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.248.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.248.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.248.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.249.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.249.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.249.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.249.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.249.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.249.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.250.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.250.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.250.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.250.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.250.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.250.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.251.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.251.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.251.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.251.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.251.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.251.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.252.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.252.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.252.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.252.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.252.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.252.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.253.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.253.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.253.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.253.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.253.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.253.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.254.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.254.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.254.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.254.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.254.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.254.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.255.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.255.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.255.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.255.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.255.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.255.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.input_layernorm.weight": "model-00089-of-000163.safetensors", "model.layers.34.post_attention_layernorm.weight": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.q_a_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.self_attn.q_a_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.q_a_layernorm.weight": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.q_b_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.self_attn.q_b_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.kv_a_proj_with_mqa.weight": "model-00089-of-000163.safetensors", - "model.layers.35.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.kv_a_layernorm.weight": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.kv_b_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.self_attn.kv_b_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.o_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.self_attn.o_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.gate.weight": "model-00089-of-000163.safetensors", "model.layers.35.mlp.gate.e_score_correction_bias": "model-00089-of-000163.safetensors", "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.shared_experts.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.shared_experts.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.shared_experts.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.0.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.0.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.0.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.0.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.0.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.1.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.1.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.1.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.1.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.1.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.2.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.2.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.2.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.2.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.2.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.3.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.3.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.3.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.3.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.3.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.4.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.4.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.4.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.4.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.4.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.5.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.5.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.5.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.5.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.5.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.6.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.6.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.6.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.6.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.6.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.7.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.7.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.7.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.7.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.7.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.8.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.8.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.8.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.8.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.8.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.9.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.9.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.9.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.9.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.9.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.10.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.10.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.10.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.10.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.10.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.11.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.11.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.11.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.11.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.11.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.12.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.12.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.12.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.12.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.12.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.13.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.13.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.13.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.13.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.13.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.14.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.14.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.14.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.14.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.14.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.15.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.15.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.15.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.15.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.15.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.16.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.16.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.16.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.16.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.16.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.17.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.17.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.17.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.17.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.17.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.18.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.18.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.18.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.18.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.18.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.19.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.19.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.19.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.19.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.19.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.20.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.20.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.20.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.20.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.20.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.21.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.21.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.21.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.21.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.21.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.22.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.22.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.22.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.22.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.22.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.23.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.23.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.23.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.23.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.23.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.24.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.24.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.24.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.24.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.24.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.25.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.25.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.25.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.25.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.25.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.26.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.26.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.26.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.26.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.26.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.27.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.27.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.27.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.27.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.27.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.28.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.28.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.28.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.28.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.28.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.29.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.29.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.29.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.29.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.29.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.30.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.30.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.30.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.30.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.30.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.31.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.31.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.31.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.31.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.31.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.32.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.32.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.32.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.32.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.32.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.33.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.33.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.33.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.33.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.33.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.34.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.34.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.34.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.34.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.34.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.35.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.35.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.35.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.35.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.35.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.36.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.36.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.36.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.36.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.36.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.37.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.37.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.37.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.37.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.37.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.38.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.38.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.38.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.38.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.38.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.39.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.39.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.39.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.39.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.39.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.40.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.40.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.40.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.40.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.40.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.41.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.41.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.41.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.41.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.41.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.42.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.42.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.42.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.42.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.42.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.43.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.43.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.43.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.43.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.43.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.44.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.44.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.44.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.44.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.44.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.45.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.45.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.45.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.45.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.45.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.46.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.46.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.46.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.46.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.46.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.47.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.47.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.47.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.47.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.47.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.48.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.48.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.48.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.48.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.48.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.49.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.49.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.49.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.49.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.49.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.50.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.50.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.50.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.50.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.50.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.51.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.51.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.51.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.51.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.51.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.52.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.52.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.52.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.52.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.52.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.53.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.53.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.53.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.53.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.53.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.54.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.54.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.54.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.54.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.54.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.55.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.55.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.55.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.55.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.55.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.56.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.56.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.56.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.56.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.56.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.57.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.57.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.57.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.57.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.57.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.58.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.58.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.58.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.58.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.58.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.59.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.59.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.59.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.59.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.59.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.60.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.60.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.60.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.60.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.60.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.61.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.61.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.61.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.61.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.61.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.62.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.62.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.62.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.62.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.62.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.63.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.63.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.63.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.63.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.63.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.64.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.64.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.64.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.64.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.64.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.65.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.65.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.65.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.65.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.65.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.66.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.66.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.66.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.66.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.66.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.67.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.67.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.67.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.67.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.67.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.68.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.68.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.68.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.68.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.68.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.69.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.69.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.69.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.69.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.69.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.70.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.70.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.70.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.70.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.70.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.71.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.71.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.71.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.71.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.71.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.72.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.72.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.72.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.72.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.72.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.73.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.73.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.73.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.73.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.73.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.74.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.74.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.74.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.74.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.74.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.75.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.75.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.75.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.75.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.75.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.76.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.76.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.76.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.76.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.76.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.77.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.77.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.77.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.77.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.77.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.78.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.78.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.78.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.78.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.78.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.79.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.79.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.79.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.79.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.79.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.80.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.80.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.80.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.80.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.80.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.81.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.81.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.81.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.81.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.81.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.82.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.82.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.82.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.82.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.82.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.83.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.83.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.83.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.83.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.83.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.84.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.84.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.84.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.84.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.84.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.85.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.85.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.85.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.85.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.85.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.86.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.86.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.86.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.86.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.86.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.87.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.87.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.87.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.87.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.87.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.88.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.88.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.88.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.88.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.88.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.89.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.89.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.89.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.89.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.89.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.90.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.90.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.90.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.90.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.90.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.91.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.91.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.91.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.91.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.91.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.92.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.92.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.92.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.92.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.92.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.93.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.93.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.93.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.93.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.93.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.94.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.94.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.94.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.94.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.94.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.95.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.95.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.95.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.95.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.95.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.96.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.96.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.96.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.96.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.96.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.97.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.97.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.97.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.97.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.97.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.98.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.98.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.98.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.98.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.98.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.99.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.99.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.99.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.99.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.99.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.100.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.100.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.100.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.100.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.100.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.101.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.101.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.101.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.101.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.101.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.102.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.102.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.102.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.102.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.102.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.103.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.103.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.103.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.103.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.103.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.104.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.104.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.104.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.104.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.104.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.105.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.105.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.105.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.105.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.105.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.106.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.106.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.106.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.106.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.106.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.107.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.107.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.107.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.107.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.107.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.108.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.108.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.108.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.108.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.108.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.109.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.109.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.109.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.109.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.109.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.110.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.110.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.110.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.110.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.110.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.111.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.111.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.111.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.111.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.111.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.112.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.112.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.112.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.112.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.112.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.113.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.113.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.113.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.113.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.113.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.114.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.114.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.114.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.114.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.114.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.115.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.115.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.115.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.115.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.115.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.116.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.116.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.116.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.116.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.116.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.117.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.117.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.117.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.117.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.117.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.118.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.118.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.118.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.118.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.118.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.119.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.119.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.119.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.119.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.119.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.120.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.120.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.120.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.120.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.120.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.121.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.121.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.121.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.121.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.121.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.122.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.122.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.122.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.122.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.122.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.123.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.123.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.123.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.123.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.123.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.124.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.124.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.124.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.124.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.124.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.125.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.125.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.125.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.125.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.125.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.126.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.126.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.126.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.126.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.126.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.127.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.127.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.127.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.127.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.127.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.128.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.128.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.128.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.128.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.128.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.128.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.129.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.129.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.129.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.129.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.129.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.129.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.130.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.130.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.130.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.130.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.130.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.130.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.131.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.131.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.131.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.131.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.131.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.131.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.132.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.132.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.132.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.132.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.132.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.132.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.133.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.133.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.133.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.133.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.133.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.133.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.134.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.134.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.134.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.134.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.134.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.134.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.135.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.135.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.135.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.135.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.135.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.135.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.136.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.136.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.136.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.136.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.136.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.136.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.137.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.137.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.137.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.137.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.137.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.137.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.138.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.138.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.138.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.138.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.138.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.138.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.139.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.139.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.139.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.139.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.139.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.139.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.140.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.140.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.140.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.140.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.140.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.140.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.141.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.141.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.141.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.141.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.141.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.141.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.142.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.142.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.142.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.142.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.142.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.142.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.143.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.143.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.143.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.143.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.143.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.143.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.144.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.144.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.144.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.144.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.144.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.144.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.145.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.145.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.145.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.145.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.145.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.145.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.146.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.146.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.146.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.146.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.146.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.146.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.147.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.147.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.147.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.147.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.147.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.147.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.148.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.148.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.148.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.148.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.148.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.148.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.149.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.149.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.149.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.149.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.149.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.149.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.150.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.150.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.150.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.150.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.150.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.150.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.151.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.151.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.151.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.151.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.151.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.151.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.152.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.152.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.152.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.152.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.152.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.152.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.153.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.153.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.153.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.153.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.153.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.153.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.154.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.154.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.154.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.154.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.154.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.154.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.155.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.155.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.155.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.155.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.155.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.155.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.156.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.156.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.156.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.156.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.156.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.156.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.157.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.157.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.157.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.157.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.157.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.157.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.158.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.158.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.158.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.158.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.158.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.158.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.159.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.159.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.159.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.159.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.159.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.159.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.160.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.160.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.160.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.160.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.160.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.160.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.161.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.161.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.161.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.161.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.161.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.161.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.162.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.162.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.162.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.162.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.162.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.162.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.163.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.163.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.163.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.163.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.163.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.163.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.164.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.164.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.164.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.164.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.164.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.164.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.165.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.165.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.165.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.165.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.165.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.165.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.166.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.166.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.166.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.166.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.166.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.166.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.167.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.167.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.167.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.167.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.167.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.167.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.168.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.168.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.168.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.168.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.168.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.168.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.169.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.169.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.169.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.169.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.169.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.169.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.170.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.170.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.170.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.170.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.170.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.170.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.171.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.171.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.171.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.171.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.171.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.171.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.172.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.172.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.172.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.172.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.172.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.172.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.173.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.173.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.173.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.173.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.173.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.173.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.174.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.174.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.174.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.174.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.174.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.174.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.175.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.175.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.175.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.175.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.175.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.175.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.176.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.176.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.176.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.176.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.176.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.176.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.177.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.177.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.177.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.177.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.177.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.177.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.178.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.178.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.178.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.178.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.178.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.178.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.179.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.179.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.179.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.179.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.179.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.179.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.180.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.180.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.180.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.180.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.180.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.180.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.181.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.181.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.181.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.181.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.181.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.181.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.182.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.182.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.182.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.182.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.182.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.182.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.183.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.183.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.183.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.183.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.183.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.183.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.184.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.184.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.184.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.184.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.184.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.184.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.185.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.185.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.185.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.185.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.185.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.185.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.186.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.186.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.186.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.186.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.186.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.186.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.187.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.187.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.187.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.187.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.187.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.187.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.188.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.188.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.188.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.188.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.188.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.188.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.189.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.189.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.189.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.189.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.189.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.189.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.190.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.190.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.190.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.190.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.190.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.190.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.191.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.191.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.191.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.191.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.191.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.191.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.192.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.192.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.192.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.192.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.192.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.192.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.193.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.193.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.193.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.193.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.193.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.193.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.194.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.194.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.194.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.194.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.194.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.194.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.195.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.195.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.195.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.195.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.195.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.195.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.196.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.196.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.196.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.196.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.196.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.196.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.197.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.197.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.197.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.197.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.197.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.197.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.198.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.198.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.198.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.198.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.198.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.198.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.199.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.199.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.199.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.199.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.199.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.199.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.200.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.200.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.200.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.200.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.200.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.200.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.201.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.201.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.201.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.201.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.201.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.201.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.202.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.202.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.202.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.202.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.202.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.202.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.203.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.203.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.203.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.203.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.203.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.203.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.204.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.204.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.204.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.204.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.204.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.204.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.205.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.205.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.205.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.205.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.205.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.205.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.206.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.206.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.206.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.206.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.206.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.206.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.207.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.207.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.207.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.207.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.207.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.207.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.208.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.208.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.208.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.208.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.208.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.208.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.209.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.209.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.209.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.209.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.209.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.209.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.210.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.210.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.210.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.210.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.210.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.210.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.211.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.211.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.211.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.211.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.211.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.211.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.212.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.212.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.212.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.212.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.212.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.212.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.213.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.213.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.213.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.213.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.213.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.213.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.214.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.214.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.214.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.214.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.214.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.214.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.215.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.215.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.215.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.215.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.215.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.215.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.216.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.216.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.216.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.216.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.216.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.216.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.217.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.217.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.217.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.217.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.217.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.217.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.218.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.218.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.218.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.218.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.218.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.218.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.219.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.219.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.219.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.219.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.219.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.219.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.220.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.220.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.220.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.220.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.220.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.220.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.221.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.221.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.221.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.221.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.221.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.221.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.222.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.222.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.222.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.222.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.222.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.222.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.223.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.223.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.223.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.223.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.223.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.223.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.224.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.224.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.224.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.224.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.224.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.224.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.225.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.225.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.225.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.225.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.225.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.225.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.226.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.226.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.226.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.226.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.226.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.226.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.227.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.227.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.227.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.227.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.227.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.227.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.228.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.228.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.228.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.228.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.228.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.228.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.229.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.229.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.229.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.229.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.229.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.229.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.230.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.230.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.230.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.230.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.230.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.230.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.231.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.231.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.231.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.231.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.231.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.231.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.232.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.232.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.232.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.232.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.232.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.232.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.233.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.233.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.233.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.233.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.233.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.233.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.234.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.234.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.234.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.234.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.234.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.234.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.235.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.235.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.235.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.235.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.235.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.235.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.236.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.236.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.236.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.236.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.236.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.236.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.237.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.237.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.237.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.237.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.237.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.237.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.238.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.238.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.238.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.238.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.238.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.238.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.239.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.239.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.239.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.239.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.239.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.239.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.240.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.240.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.240.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.240.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.240.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.240.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.241.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.241.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.241.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.241.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.241.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.241.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.242.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.242.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.242.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.242.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.242.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.242.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.243.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.243.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.243.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.243.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.243.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.243.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.244.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.244.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.244.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.244.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.244.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.244.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.245.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.245.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.245.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.245.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.245.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.245.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.246.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.246.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.246.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.246.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.246.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.246.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.247.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.247.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.247.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.247.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.247.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.247.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.248.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.248.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.248.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.248.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.248.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.248.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.249.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.249.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.249.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.249.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.249.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.249.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.250.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.250.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.250.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.250.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.250.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.250.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.251.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.251.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.251.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.251.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.251.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.251.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.252.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.252.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.252.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.252.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.252.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.252.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.253.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.253.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.253.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.253.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.253.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.253.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.254.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.254.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.254.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.254.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.254.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.254.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.255.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.255.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.255.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.255.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.255.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.255.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.input_layernorm.weight": "model-00092-of-000163.safetensors", "model.layers.35.post_attention_layernorm.weight": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.q_a_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.self_attn.q_a_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.q_a_layernorm.weight": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.q_b_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.self_attn.q_b_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.kv_a_proj_with_mqa.weight": "model-00092-of-000163.safetensors", - "model.layers.36.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.kv_a_layernorm.weight": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.kv_b_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.self_attn.kv_b_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.o_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.self_attn.o_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.gate.weight": "model-00092-of-000163.safetensors", "model.layers.36.mlp.gate.e_score_correction_bias": "model-00092-of-000163.safetensors", "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.shared_experts.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.shared_experts.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.shared_experts.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.0.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.0.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.0.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.0.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.0.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.1.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.1.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.1.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.1.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.1.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.2.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.2.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.2.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.2.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.2.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.3.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.3.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.3.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.3.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.3.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.4.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.4.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.4.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.4.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.4.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.5.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.5.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.5.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.5.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.5.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.6.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.6.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.6.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.6.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.6.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.7.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.7.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.7.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.7.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.7.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.8.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.8.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.8.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.8.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.8.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.9.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.9.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.9.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.9.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.9.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.10.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.10.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.10.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.10.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.10.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.11.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.11.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.11.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.11.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.11.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.11.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.12.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.12.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.12.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.12.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.12.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.13.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.13.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.13.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.13.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.13.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.14.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.14.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.14.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.14.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.14.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.15.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.15.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.15.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.15.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.15.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.16.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.16.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.16.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.16.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.16.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.17.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.17.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.17.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.17.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.17.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.18.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.18.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.18.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.18.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.18.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.19.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.19.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.19.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.19.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.19.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.20.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.20.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.20.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.20.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.20.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.21.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.21.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.21.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.21.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.21.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.22.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.22.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.22.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.22.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.22.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.23.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.23.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.23.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.23.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.23.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.24.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.24.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.24.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.24.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.24.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.25.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.25.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.25.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.25.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.25.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.26.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.26.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.26.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.26.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.26.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.27.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.27.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.27.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.27.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.27.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.28.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.28.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.28.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.28.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.28.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.29.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.29.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.29.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.29.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.29.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.30.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.30.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.30.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.30.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.30.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.31.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.31.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.31.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.31.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.31.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.32.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.32.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.32.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.32.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.32.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.33.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.33.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.33.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.33.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.33.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.34.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.34.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.34.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.34.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.34.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.35.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.35.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.35.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.35.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.35.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.36.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.36.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.36.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.36.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.36.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.37.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.37.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.37.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.37.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.37.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.38.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.38.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.38.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.38.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.38.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.39.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.39.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.39.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.39.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.39.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.40.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.40.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.40.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.40.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.40.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.41.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.41.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.41.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.41.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.41.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.42.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.42.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.42.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.42.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.42.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.43.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.43.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.43.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.43.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.43.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.44.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.44.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.44.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.44.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.44.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.45.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.45.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.45.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.45.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.45.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.46.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.46.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.46.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.46.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.46.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.47.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.47.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.47.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.47.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.47.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.48.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.48.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.48.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.48.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.48.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.49.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.49.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.49.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.49.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.49.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.50.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.50.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.50.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.50.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.50.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.51.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.51.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.51.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.51.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.51.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.52.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.52.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.52.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.52.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.52.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.53.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.53.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.53.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.53.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.53.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.54.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.54.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.54.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.54.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.54.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.55.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.55.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.55.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.55.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.55.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.56.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.56.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.56.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.56.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.56.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.57.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.57.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.57.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.57.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.57.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.58.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.58.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.58.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.58.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.58.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.59.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.59.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.59.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.59.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.59.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.60.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.60.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.60.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.60.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.60.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.61.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.61.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.61.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.61.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.61.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.62.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.62.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.62.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.62.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.62.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.63.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.63.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.63.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.63.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.63.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.64.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.64.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.64.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.64.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.64.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.65.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.65.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.65.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.65.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.65.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.66.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.66.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.66.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.66.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.66.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.67.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.67.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.67.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.67.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.67.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.67.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.68.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.68.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.68.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.68.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.68.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.69.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.69.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.69.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.69.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.69.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.70.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.70.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.70.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.70.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.70.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.71.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.71.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.71.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.71.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.71.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.72.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.72.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.72.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.72.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.72.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.73.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.73.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.73.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.73.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.73.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.74.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.74.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.74.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.74.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.74.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.75.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.75.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.75.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.75.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.75.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.76.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.76.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.76.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.76.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.76.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.77.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.77.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.77.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.77.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.77.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.78.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.78.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.78.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.78.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.78.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.79.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.79.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.79.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.79.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.79.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.80.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.80.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.80.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.80.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.80.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.81.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.81.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.81.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.81.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.81.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.82.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.82.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.82.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.82.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.82.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.83.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.83.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.83.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.83.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.83.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.84.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.84.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.84.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.84.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.84.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.85.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.85.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.85.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.85.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.85.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.86.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.86.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.86.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.86.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.86.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.87.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.87.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.87.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.87.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.87.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.88.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.88.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.88.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.88.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.88.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.89.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.89.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.89.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.89.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.89.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.90.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.90.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.90.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.90.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.90.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.91.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.91.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.91.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.91.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.91.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.92.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.92.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.92.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.92.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.92.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.93.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.93.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.93.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.93.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.93.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.94.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.94.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.94.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.94.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.94.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.95.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.95.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.95.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.95.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.95.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.96.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.96.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.96.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.96.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.96.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.97.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.97.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.97.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.97.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.97.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.98.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.98.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.98.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.98.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.98.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.99.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.99.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.99.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.99.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.99.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.100.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.100.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.100.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.100.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.100.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.101.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.101.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.101.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.101.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.101.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.102.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.102.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.102.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.102.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.102.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.103.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.103.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.103.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.103.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.103.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.104.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.104.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.104.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.104.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.104.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.105.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.105.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.105.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.105.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.105.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.106.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.106.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.106.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.106.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.106.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.107.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.107.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.107.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.107.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.107.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.108.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.108.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.108.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.108.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.108.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.109.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.109.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.109.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.109.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.109.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.110.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.110.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.110.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.110.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.110.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.111.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.111.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.111.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.111.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.111.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.112.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.112.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.112.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.112.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.112.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.113.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.113.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.113.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.113.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.113.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.114.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.114.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.114.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.114.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.114.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.115.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.115.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.115.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.115.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.115.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.116.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.116.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.116.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.116.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.116.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.117.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.117.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.117.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.117.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.117.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.118.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.118.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.118.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.118.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.118.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.119.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.119.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.119.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.119.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.119.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.120.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.120.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.120.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.120.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.120.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.121.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.121.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.121.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.121.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.121.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.122.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.122.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.122.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.122.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.122.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.123.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.123.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.123.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.123.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.123.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.124.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.124.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.124.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.124.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.124.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.125.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.125.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.125.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.125.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.125.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.126.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.126.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.126.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.126.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.126.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.127.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.127.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.127.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.127.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.127.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.128.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.128.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.128.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.128.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.128.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.128.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.129.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.129.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.129.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.129.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.129.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.129.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.130.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.130.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.130.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.130.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.130.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.130.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.131.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.131.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.131.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.131.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.131.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.131.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.132.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.132.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.132.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.132.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.132.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.132.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.133.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.133.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.133.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.133.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.133.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.133.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.134.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.134.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.134.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.134.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.134.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.134.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.135.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.135.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.135.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.135.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.135.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.135.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.136.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.136.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.136.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.136.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.136.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.136.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.137.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.137.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.137.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.137.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.137.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.137.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.138.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.138.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.138.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.138.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.138.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.138.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.139.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.139.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.139.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.139.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.139.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.139.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.140.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.140.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.140.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.140.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.140.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.140.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.141.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.141.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.141.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.141.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.141.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.141.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.142.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.142.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.142.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.142.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.142.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.142.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.143.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.143.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.143.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.143.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.143.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.143.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.144.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.144.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.144.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.144.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.144.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.144.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.145.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.145.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.145.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.145.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.145.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.145.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.146.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.146.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.146.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.146.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.146.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.146.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.147.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.147.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.147.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.147.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.147.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.147.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.148.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.148.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.148.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.148.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.148.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.148.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.149.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.149.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.149.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.149.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.149.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.149.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.150.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.150.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.150.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.150.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.150.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.150.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.151.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.151.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.151.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.151.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.151.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.151.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.152.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.152.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.152.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.152.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.152.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.152.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.153.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.153.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.153.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.153.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.153.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.153.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.154.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.154.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.154.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.154.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.154.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.154.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.155.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.155.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.155.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.155.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.155.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.155.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.156.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.156.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.156.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.156.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.156.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.156.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.157.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.157.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.157.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.157.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.157.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.157.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.158.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.158.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.158.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.158.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.158.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.158.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.159.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.159.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.159.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.159.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.159.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.159.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.160.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.160.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.160.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.160.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.160.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.160.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.161.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.161.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.161.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.161.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.161.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.161.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.162.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.162.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.162.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.162.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.162.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.162.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.163.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.163.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.163.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.163.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.163.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.163.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.164.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.164.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.164.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.164.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.164.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.164.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.165.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.165.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.165.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.165.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.165.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.165.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.166.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.166.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.166.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.166.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.166.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.166.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.167.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.167.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.167.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.167.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.167.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.167.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.168.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.168.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.168.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.168.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.168.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.168.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.169.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.169.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.169.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.169.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.169.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.169.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.170.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.170.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.170.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.170.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.170.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.170.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.171.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.171.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.171.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.171.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.171.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.171.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.172.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.172.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.172.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.172.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.172.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.172.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.173.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.173.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.173.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.173.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.173.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.173.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.174.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.174.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.174.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.174.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.174.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.174.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.175.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.175.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.175.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.175.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.175.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.175.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.176.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.176.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.176.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.176.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.176.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.176.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.177.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.177.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.177.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.177.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.177.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.177.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.178.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.178.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.178.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.178.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.178.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.178.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.179.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.179.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.179.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.179.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.179.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.179.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.180.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.180.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.180.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.180.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.180.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.180.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.181.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.181.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.181.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.181.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.181.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.181.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.182.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.182.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.182.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.182.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.182.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.182.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.183.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.183.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.183.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.183.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.183.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.183.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.184.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.184.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.184.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.184.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.184.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.184.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.185.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.185.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.185.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.185.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.185.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.185.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.186.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.186.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.186.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.186.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.186.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.186.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.187.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.187.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.187.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.187.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.187.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.187.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.188.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.188.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.188.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.188.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.188.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.188.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.189.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.189.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.189.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.189.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.189.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.189.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.190.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.190.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.190.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.190.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.190.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.190.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.191.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.191.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.191.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.191.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.191.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.191.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.192.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.192.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.192.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.192.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.192.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.192.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.193.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.193.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.193.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.193.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.193.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.193.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.194.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.194.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.194.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.194.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.194.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.194.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.195.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.195.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.195.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.195.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.195.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.195.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.196.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.196.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.196.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.196.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.196.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.196.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.197.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.197.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.197.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.197.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.197.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.197.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.198.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.198.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.198.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.198.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.198.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.198.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.199.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.199.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.199.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.199.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.199.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.199.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.200.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.200.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.200.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.200.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.200.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.200.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.201.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.201.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.201.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.201.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.201.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.201.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.202.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.202.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.202.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.202.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.202.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.202.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.203.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.203.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.203.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.203.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.203.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.203.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.204.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.204.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.204.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.204.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.204.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.204.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.205.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.205.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.205.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.205.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.205.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.205.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.206.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.206.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.206.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.206.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.206.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.206.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.207.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.207.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.207.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.207.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.207.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.207.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.208.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.208.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.208.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.208.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.208.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.208.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.209.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.209.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.209.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.209.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.209.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.209.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.210.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.210.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.210.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.210.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.210.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.210.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.211.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.211.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.211.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.211.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.211.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.211.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.212.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.212.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.212.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.212.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.212.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.212.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.213.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.213.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.213.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.213.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.213.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.213.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.214.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.214.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.214.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.214.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.214.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.214.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.215.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.215.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.215.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.215.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.215.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.215.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.216.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.216.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.216.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.216.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.216.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.216.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.217.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.217.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.217.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.217.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.217.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.217.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.218.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.218.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.218.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.218.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.218.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.218.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.219.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.219.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.219.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.219.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.219.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.219.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.220.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.220.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.220.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.220.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.220.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.220.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.221.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.221.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.221.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.221.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.221.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.221.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.222.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.222.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.222.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.222.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.222.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.222.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.223.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.223.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.223.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.223.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.223.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.223.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.224.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.224.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.224.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.224.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.224.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.224.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.225.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.225.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.225.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.225.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.225.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.225.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.226.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.226.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.226.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.226.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.226.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.226.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.227.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.227.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.227.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.227.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.227.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.227.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.228.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.228.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.228.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.228.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.228.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.228.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.229.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.229.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.229.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.229.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.229.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.229.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.230.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.230.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.230.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.230.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.230.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.230.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.231.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.231.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.231.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.231.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.231.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.231.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.232.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.232.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.232.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.232.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.232.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.232.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.233.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.233.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.233.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.233.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.233.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.233.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.234.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.234.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.234.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.234.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.234.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.234.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.235.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.235.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.235.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.235.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.235.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.235.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.236.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.236.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.236.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.236.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.236.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.236.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.237.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.237.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.237.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.237.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.237.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.237.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.238.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.238.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.238.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.238.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.238.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.238.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.239.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.239.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.239.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.239.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.239.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.239.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.240.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.240.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.240.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.240.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.240.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.240.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.241.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.241.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.241.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.241.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.241.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.241.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.242.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.242.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.242.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.242.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.242.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.242.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.243.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.243.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.243.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.243.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.243.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.243.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.244.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.244.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.244.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.244.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.244.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.244.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.245.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.245.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.245.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.245.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.245.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.245.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.246.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.246.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.246.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.246.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.246.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.246.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.247.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.247.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.247.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.247.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.247.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.247.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.248.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.248.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.248.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.248.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.248.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.248.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.249.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.249.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.249.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.249.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.249.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.249.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.250.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.250.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.250.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.250.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.250.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.250.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.251.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.251.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.251.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.251.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.251.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.251.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.252.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.252.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.252.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.252.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.252.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.252.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.253.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.253.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.253.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.253.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.253.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.253.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.254.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.254.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.254.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.254.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.254.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.254.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.255.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.255.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.255.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.255.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.255.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.255.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.input_layernorm.weight": "model-00095-of-000163.safetensors", "model.layers.36.post_attention_layernorm.weight": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.q_a_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.self_attn.q_a_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.q_a_layernorm.weight": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.q_b_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.self_attn.q_b_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.kv_a_proj_with_mqa.weight": "model-00095-of-000163.safetensors", - "model.layers.37.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.kv_a_layernorm.weight": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.kv_b_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.self_attn.kv_b_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.o_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.self_attn.o_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.gate.weight": "model-00095-of-000163.safetensors", "model.layers.37.mlp.gate.e_score_correction_bias": "model-00095-of-000163.safetensors", "model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.shared_experts.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.shared_experts.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.shared_experts.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.0.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.0.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.0.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.0.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.0.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.1.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.1.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.1.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.1.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.1.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.2.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.2.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.2.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.2.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.2.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.3.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.3.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.3.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.3.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.3.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.4.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.4.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.4.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.4.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.4.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.5.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.5.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.5.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.5.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.5.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.6.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.6.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.6.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.6.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.6.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.7.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.7.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.7.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.7.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.7.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.8.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.8.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.8.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.8.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.8.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.9.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.9.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.9.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.9.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.9.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.10.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.10.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.10.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.10.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.10.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.11.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.11.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.11.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.11.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.11.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.12.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.12.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.12.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.12.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.12.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.13.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.13.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.13.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.13.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.13.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.14.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.14.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.14.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.14.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.14.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.15.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.15.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.15.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.15.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.15.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.16.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.16.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.16.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.16.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.16.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.17.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.17.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.17.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.17.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.17.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.18.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.18.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.18.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.18.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.18.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.19.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.19.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.19.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.19.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.19.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.20.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.20.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.20.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.20.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.20.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.21.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.21.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.21.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.21.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.21.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.22.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.22.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.22.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.22.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.22.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.23.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.23.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.23.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.23.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.23.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.24.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.24.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.24.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.24.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.24.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.25.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.25.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.25.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.25.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.25.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.26.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.26.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.26.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.26.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.26.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.27.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.27.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.27.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.27.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.27.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.28.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.28.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.28.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.28.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.28.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.29.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.29.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.29.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.29.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.29.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.30.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.30.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.30.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.30.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.30.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.31.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.31.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.31.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.31.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.31.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.32.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.32.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.32.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.32.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.32.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.33.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.33.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.33.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.33.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.33.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.34.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.34.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.34.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.34.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.34.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.35.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.35.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.35.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.35.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.35.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.36.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.36.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.36.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.36.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.36.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.37.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.37.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.37.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.37.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.37.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.38.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.38.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.38.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.38.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.38.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.39.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.39.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.39.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.39.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.39.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.40.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.40.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.40.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.40.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.40.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.41.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.41.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.41.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.41.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.41.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.42.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.42.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.42.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.42.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.42.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.43.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.43.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.43.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.43.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.43.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.44.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.44.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.44.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.44.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.44.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.45.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.45.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.45.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.45.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.45.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.46.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.46.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.46.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.46.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.46.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.47.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.47.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.47.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.47.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.47.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.48.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.48.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.48.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.48.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.48.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.49.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.49.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.49.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.49.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.49.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.50.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.50.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.50.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.50.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.50.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.51.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.51.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.51.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.51.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.51.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.52.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.52.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.52.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.52.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.52.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.53.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.53.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.53.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.53.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.53.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.54.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.54.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.54.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.54.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.54.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.55.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.55.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.55.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.55.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.55.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.56.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.56.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.56.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.56.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.56.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.57.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.57.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.57.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.57.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.57.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.58.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.58.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.58.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.58.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.58.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.59.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.59.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.59.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.59.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.59.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.60.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.60.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.60.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.60.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.60.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.61.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.61.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.61.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.61.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.61.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.62.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.62.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.62.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.62.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.62.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.63.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.63.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.63.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.63.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.63.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.64.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.64.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.64.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.64.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.64.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.65.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.65.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.65.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.65.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.65.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.66.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.66.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.66.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.66.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.66.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.66.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.67.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.67.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.67.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.67.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.67.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.68.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.68.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.68.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.68.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.68.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.69.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.69.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.69.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.69.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.69.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.70.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.70.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.70.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.70.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.70.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.71.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.71.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.71.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.71.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.71.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.72.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.72.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.72.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.72.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.72.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.73.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.73.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.73.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.73.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.73.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.74.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.74.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.74.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.74.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.74.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.75.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.75.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.75.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.75.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.75.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.76.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.76.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.76.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.76.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.76.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.77.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.77.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.77.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.77.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.77.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.78.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.78.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.78.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.78.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.78.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.79.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.79.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.79.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.79.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.79.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.80.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.80.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.80.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.80.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.80.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.81.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.81.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.81.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.81.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.81.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.82.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.82.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.82.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.82.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.82.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.83.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.83.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.83.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.83.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.83.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.84.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.84.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.84.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.84.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.84.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.85.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.85.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.85.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.85.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.85.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.86.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.86.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.86.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.86.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.86.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.87.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.87.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.87.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.87.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.87.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.88.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.88.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.88.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.88.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.88.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.89.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.89.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.89.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.89.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.89.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.90.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.90.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.90.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.90.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.90.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.91.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.91.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.91.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.91.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.91.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.92.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.92.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.92.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.92.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.92.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.93.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.93.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.93.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.93.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.93.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.94.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.94.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.94.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.94.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.94.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.95.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.95.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.95.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.95.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.95.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.96.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.96.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.96.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.96.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.96.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.97.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.97.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.97.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.97.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.97.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.98.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.98.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.98.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.98.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.98.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.99.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.99.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.99.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.99.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.99.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.100.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.100.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.100.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.100.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.100.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.101.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.101.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.101.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.101.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.101.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.102.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.102.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.102.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.102.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.102.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.103.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.103.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.103.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.103.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.103.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.104.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.104.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.104.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.104.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.104.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.105.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.105.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.105.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.105.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.105.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.106.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.106.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.106.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.106.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.106.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.107.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.107.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.107.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.107.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.107.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.108.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.108.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.108.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.108.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.108.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.109.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.109.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.109.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.109.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.109.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.110.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.110.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.110.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.110.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.110.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.111.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.111.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.111.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.111.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.111.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.112.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.112.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.112.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.112.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.112.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.113.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.113.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.113.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.113.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.113.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.114.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.114.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.114.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.114.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.114.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.115.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.115.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.115.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.115.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.115.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.116.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.116.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.116.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.116.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.116.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.117.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.117.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.117.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.117.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.117.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.118.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.118.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.118.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.118.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.118.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.119.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.119.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.119.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.119.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.119.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.120.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.120.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.120.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.120.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.120.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.121.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.121.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.121.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.121.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.121.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.122.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.122.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.122.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.122.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.122.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.123.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.123.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.123.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.123.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.123.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.124.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.124.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.124.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.124.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.124.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.125.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.125.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.125.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.125.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.125.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.126.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.126.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.126.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.126.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.126.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.127.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.127.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.127.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.127.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.127.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.128.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.128.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.128.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.128.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.128.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.128.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.129.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.129.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.129.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.129.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.129.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.129.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.130.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.130.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.130.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.130.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.130.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.130.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.131.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.131.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.131.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.131.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.131.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.131.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.132.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.132.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.132.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.132.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.132.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.132.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.133.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.133.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.133.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.133.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.133.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.133.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.134.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.134.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.134.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.134.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.134.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.134.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.135.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.135.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.135.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.135.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.135.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.135.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.136.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.136.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.136.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.136.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.136.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.136.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.137.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.137.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.137.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.137.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.137.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.137.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.138.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.138.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.138.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.138.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.138.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.138.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.139.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.139.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.139.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.139.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.139.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.139.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.140.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.140.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.140.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.140.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.140.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.140.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.141.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.141.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.141.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.141.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.141.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.141.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.142.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.142.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.142.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.142.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.142.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.142.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.143.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.143.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.143.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.143.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.143.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.143.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.144.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.144.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.144.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.144.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.144.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.144.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.145.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.145.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.145.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.145.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.145.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.145.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.146.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.146.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.146.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.146.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.146.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.146.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.147.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.147.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.147.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.147.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.147.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.147.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.148.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.148.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.148.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.148.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.148.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.148.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.149.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.149.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.149.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.149.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.149.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.149.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.150.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.150.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.150.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.150.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.150.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.150.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.151.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.151.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.151.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.151.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.151.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.151.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.152.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.152.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.152.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.152.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.152.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.152.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.153.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.153.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.153.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.153.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.153.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.153.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.154.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.154.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.154.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.154.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.154.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.154.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.155.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.155.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.155.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.155.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.155.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.155.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.156.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.156.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.156.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.156.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.156.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.156.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.157.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.157.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.157.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.157.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.157.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.157.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.158.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.158.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.158.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.158.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.158.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.158.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.159.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.159.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.159.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.159.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.159.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.159.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.160.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.160.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.160.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.160.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.160.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.160.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.161.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.161.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.161.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.161.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.161.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.161.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.162.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.162.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.162.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.162.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.162.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.162.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.163.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.163.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.163.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.163.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.163.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.163.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.164.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.164.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.164.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.164.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.164.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.164.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.165.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.165.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.165.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.165.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.165.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.165.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.166.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.166.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.166.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.166.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.166.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.166.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.167.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.167.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.167.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.167.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.167.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.167.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.168.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.168.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.168.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.168.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.168.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.168.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.169.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.169.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.169.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.169.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.169.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.169.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.170.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.170.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.170.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.170.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.170.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.170.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.171.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.171.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.171.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.171.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.171.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.171.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.172.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.172.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.172.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.172.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.172.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.172.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.173.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.173.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.173.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.173.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.173.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.173.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.174.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.174.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.174.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.174.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.174.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.174.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.175.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.175.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.175.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.175.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.175.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.175.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.176.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.176.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.176.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.176.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.176.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.176.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.177.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.177.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.177.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.177.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.177.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.177.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.178.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.178.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.178.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.178.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.178.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.178.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.179.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.179.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.179.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.179.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.179.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.179.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.180.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.180.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.180.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.180.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.180.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.180.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.181.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.181.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.181.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.181.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.181.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.181.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.182.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.182.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.182.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.182.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.182.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.182.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.183.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.183.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.183.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.183.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.183.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.183.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.184.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.184.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.184.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.184.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.184.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.184.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.185.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.185.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.185.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.185.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.185.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.185.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.186.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.186.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.186.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.186.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.186.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.186.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.187.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.187.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.187.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.187.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.187.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.187.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.188.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.188.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.188.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.188.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.188.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.188.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.189.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.189.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.189.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.189.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.189.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.189.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.190.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.190.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.190.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.190.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.190.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.190.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.191.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.191.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.191.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.191.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.191.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.191.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.192.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.192.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.192.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.192.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.192.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.192.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.193.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.193.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.193.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.193.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.193.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.193.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.194.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.194.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.194.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.194.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.194.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.194.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.195.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.195.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.195.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.195.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.195.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.195.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.196.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.196.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.196.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.196.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.196.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.196.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.197.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.197.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.197.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.197.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.197.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.197.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.198.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.198.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.198.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.198.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.198.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.198.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.199.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.199.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.199.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.199.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.199.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.199.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.200.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.200.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.200.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.200.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.200.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.200.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.201.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.201.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.201.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.201.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.201.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.201.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.202.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.202.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.202.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.202.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.202.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.202.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.203.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.203.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.203.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.203.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.203.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.203.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.204.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.204.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.204.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.204.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.204.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.204.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.205.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.205.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.205.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.205.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.205.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.205.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.206.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.206.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.206.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.206.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.206.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.206.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.207.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.207.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.207.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.207.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.207.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.207.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.208.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.208.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.208.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.208.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.208.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.208.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.209.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.209.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.209.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.209.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.209.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.209.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.210.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.210.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.210.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.210.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.210.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.210.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.211.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.211.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.211.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.211.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.211.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.211.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.212.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.212.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.212.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.212.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.212.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.212.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.213.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.213.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.213.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.213.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.213.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.213.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.214.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.214.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.214.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.214.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.214.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.214.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.215.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.215.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.215.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.215.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.215.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.215.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.216.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.216.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.216.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.216.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.216.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.216.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.217.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.217.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.217.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.217.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.217.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.217.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.218.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.218.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.218.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.218.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.218.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.218.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.219.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.219.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.219.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.219.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.219.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.219.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.220.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.220.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.220.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.220.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.220.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.220.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.221.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.221.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.221.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.221.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.221.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.221.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.222.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.222.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.222.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.222.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.222.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.222.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.223.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.223.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.223.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.223.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.223.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.223.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.224.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.224.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.224.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.224.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.224.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.224.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.225.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.225.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.225.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.225.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.225.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.225.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.226.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.226.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.226.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.226.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.226.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.226.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.227.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.227.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.227.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.227.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.227.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.227.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.228.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.228.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.228.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.228.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.228.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.228.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.229.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.229.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.229.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.229.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.229.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.229.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.230.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.230.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.230.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.230.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.230.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.230.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.231.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.231.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.231.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.231.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.231.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.231.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.232.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.232.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.232.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.232.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.232.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.232.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.233.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.233.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.233.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.233.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.233.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.233.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.234.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.234.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.234.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.234.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.234.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.234.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.235.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.235.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.235.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.235.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.235.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.235.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.236.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.236.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.236.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.236.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.236.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.236.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.237.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.237.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.237.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.237.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.237.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.237.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.238.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.238.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.238.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.238.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.238.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.238.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.239.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.239.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.239.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.239.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.239.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.239.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.240.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.240.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.240.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.240.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.240.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.240.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.241.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.241.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.241.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.241.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.241.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.241.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.242.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.242.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.242.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.242.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.242.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.242.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.243.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.243.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.243.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.243.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.243.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.243.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.244.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.244.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.244.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.244.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.244.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.244.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.245.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.245.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.245.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.245.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.245.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.245.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.246.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.246.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.246.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.246.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.246.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.246.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.247.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.247.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.247.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.247.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.247.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.247.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.248.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.248.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.248.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.248.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.248.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.248.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.249.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.249.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.249.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.249.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.249.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.249.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.250.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.250.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.250.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.250.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.250.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.250.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.251.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.251.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.251.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.251.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.251.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.251.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.252.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.252.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.252.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.252.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.252.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.252.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.253.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.253.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.253.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.253.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.253.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.253.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.254.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.254.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.254.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.254.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.254.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.254.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.255.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.255.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.255.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.255.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.255.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.255.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.input_layernorm.weight": "model-00097-of-000163.safetensors", "model.layers.37.post_attention_layernorm.weight": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.q_a_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.self_attn.q_a_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.q_a_layernorm.weight": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.q_b_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.self_attn.q_b_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.kv_a_proj_with_mqa.weight": "model-00097-of-000163.safetensors", - "model.layers.38.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.kv_a_layernorm.weight": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.kv_b_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.self_attn.kv_b_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.o_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.self_attn.o_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.gate.weight": "model-00097-of-000163.safetensors", "model.layers.38.mlp.gate.e_score_correction_bias": "model-00097-of-000163.safetensors", "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.shared_experts.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.shared_experts.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.shared_experts.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.0.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.0.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.0.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.0.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.0.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.1.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.1.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.1.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.1.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.1.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.2.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.2.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.2.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.2.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.2.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.3.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.3.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.3.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.3.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.3.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.4.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.4.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.4.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.4.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.4.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.5.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.5.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.5.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.5.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.5.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.6.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.6.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.6.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.6.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.6.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.7.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.7.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.7.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.7.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.7.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.8.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.8.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.8.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.8.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.8.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.9.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.9.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.9.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.9.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.9.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.10.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.10.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.10.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.10.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.10.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.11.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.11.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.11.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.11.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.11.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.12.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.12.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.12.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.12.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.12.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.13.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.13.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.13.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.13.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.13.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.14.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.14.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.14.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.14.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.14.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.15.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.15.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.15.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.15.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.15.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.16.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.16.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.16.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.16.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.16.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.17.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.17.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.17.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.17.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.17.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.18.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.18.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.18.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.18.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.18.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.19.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.19.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.19.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.19.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.19.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.20.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.20.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.20.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.20.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.20.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.21.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.21.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.21.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.21.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.21.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.22.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.22.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.22.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.22.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.22.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.23.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.23.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.23.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.23.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.23.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.24.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.24.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.24.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.24.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.24.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.24.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.25.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.25.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.25.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.25.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.25.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.26.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.26.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.26.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.26.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.26.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.27.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.27.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.27.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.27.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.27.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.28.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.28.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.28.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.28.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.28.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.29.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.29.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.29.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.29.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.29.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.30.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.30.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.30.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.30.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.30.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.31.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.31.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.31.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.31.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.31.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.32.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.32.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.32.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.32.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.32.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.33.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.33.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.33.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.33.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.33.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.34.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.34.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.34.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.34.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.34.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.35.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.35.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.35.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.35.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.35.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.36.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.36.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.36.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.36.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.36.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.37.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.37.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.37.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.37.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.37.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.38.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.38.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.38.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.38.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.38.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.38.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.39.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.39.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.39.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.39.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.39.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.40.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.40.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.40.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.40.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.40.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.41.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.41.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.41.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.41.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.41.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.42.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.42.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.42.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.42.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.42.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.43.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.43.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.43.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.43.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.43.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.44.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.44.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.44.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.44.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.44.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.45.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.45.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.45.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.45.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.45.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.46.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.46.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.46.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.46.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.46.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.47.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.47.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.47.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.47.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.47.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.47.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.48.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.48.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.48.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.48.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.48.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.49.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.49.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.49.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.49.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.49.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.50.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.50.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.50.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.50.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.50.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.51.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.51.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.51.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.51.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.51.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.52.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.52.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.52.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.52.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.52.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.53.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.53.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.53.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.53.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.53.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.54.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.54.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.54.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.54.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.54.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.54.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.55.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.55.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.55.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.55.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.55.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.56.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.56.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.56.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.56.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.56.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.57.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.57.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.57.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.57.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.57.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.58.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.58.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.58.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.58.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.58.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.59.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.59.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.59.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.59.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.59.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.60.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.60.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.60.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.60.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.60.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.61.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.61.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.61.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.61.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.61.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.62.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.62.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.62.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.62.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.62.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.63.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.63.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.63.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.63.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.63.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.64.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.64.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.64.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.64.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.64.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.65.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.65.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.65.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.65.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.65.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.66.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.66.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.66.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.66.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.66.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.67.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.67.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.67.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.67.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.67.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.68.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.68.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.68.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.68.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.68.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.69.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.69.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.69.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.69.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.69.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.70.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.70.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.70.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.70.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.70.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.71.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.71.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.71.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.71.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.71.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.72.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.72.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.72.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.72.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.72.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.73.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.73.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.73.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.73.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.73.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.74.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.74.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.74.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.74.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.74.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.75.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.75.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.75.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.75.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.75.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.76.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.76.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.76.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.76.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.76.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.77.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.77.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.77.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.77.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.77.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.78.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.78.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.78.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.78.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.78.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.79.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.79.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.79.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.79.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.79.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.80.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.80.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.80.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.80.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.80.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.81.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.81.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.81.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.81.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.81.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.82.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.82.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.82.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.82.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.82.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.83.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.83.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.83.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.83.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.83.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.84.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.84.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.84.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.84.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.84.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.85.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.85.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.85.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.85.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.85.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.86.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.86.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.86.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.86.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.86.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.87.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.87.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.87.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.87.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.87.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.88.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.88.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.88.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.88.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.88.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.89.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.89.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.89.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.89.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.89.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.90.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.90.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.90.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.90.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.90.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.91.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.91.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.91.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.91.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.91.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.92.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.92.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.92.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.92.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.92.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.93.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.93.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.93.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.93.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.93.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.94.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.94.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.94.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.94.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.94.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.95.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.95.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.95.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.95.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.95.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.96.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.96.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.96.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.96.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.96.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.97.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.97.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.97.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.97.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.97.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.98.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.98.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.98.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.98.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.98.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.99.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.99.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.99.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.99.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.99.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.100.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.100.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.100.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.100.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.100.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.101.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.101.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.101.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.101.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.101.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.102.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.102.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.102.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.102.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.102.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.103.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.103.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.103.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.103.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.103.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.104.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.104.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.104.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.104.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.104.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.105.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.105.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.105.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.105.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.105.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.106.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.106.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.106.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.106.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.106.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.107.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.107.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.107.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.107.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.107.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.108.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.108.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.108.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.108.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.108.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.109.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.109.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.109.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.109.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.109.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.110.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.110.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.110.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.110.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.110.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.111.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.111.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.111.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.111.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.111.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.112.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.112.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.112.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.112.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.112.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.113.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.113.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.113.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.113.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.113.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.114.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.114.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.114.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.114.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.114.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.115.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.115.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.115.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.115.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.115.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.116.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.116.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.116.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.116.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.116.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.117.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.117.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.117.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.117.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.117.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.118.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.118.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.118.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.118.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.118.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.119.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.119.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.119.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.119.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.119.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.120.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.120.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.120.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.120.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.120.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.121.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.121.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.121.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.121.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.121.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.122.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.122.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.122.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.122.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.122.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.123.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.123.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.123.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.123.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.123.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.124.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.124.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.124.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.124.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.124.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.125.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.125.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.125.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.125.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.125.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.126.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.126.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.126.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.126.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.126.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.127.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.127.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.127.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.127.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.127.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.128.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.128.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.128.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.128.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.128.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.128.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.129.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.129.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.129.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.129.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.129.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.129.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.130.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.130.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.130.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.130.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.130.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.130.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.131.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.131.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.131.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.131.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.131.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.131.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.132.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.132.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.132.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.132.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.132.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.132.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.133.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.133.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.133.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.133.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.133.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.133.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.134.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.134.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.134.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.134.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.134.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.134.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.135.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.135.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.135.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.135.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.135.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.135.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.136.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.136.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.136.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.136.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.136.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.136.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.137.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.137.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.137.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.137.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.137.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.137.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.138.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.138.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.138.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.138.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.138.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.138.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.139.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.139.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.139.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.139.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.139.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.139.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.140.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.140.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.140.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.140.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.140.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.140.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.141.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.141.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.141.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.141.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.141.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.141.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.142.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.142.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.142.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.142.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.142.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.142.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.143.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.143.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.143.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.143.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.143.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.143.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.144.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.144.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.144.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.144.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.144.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.144.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.145.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.145.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.145.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.145.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.145.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.145.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.146.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.146.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.146.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.146.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.146.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.146.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.147.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.147.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.147.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.147.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.147.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.147.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.148.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.148.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.148.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.148.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.148.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.148.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.149.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.149.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.149.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.149.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.149.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.149.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.150.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.150.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.150.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.150.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.150.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.150.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.151.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.151.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.151.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.151.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.151.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.151.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.152.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.152.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.152.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.152.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.152.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.152.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.153.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.153.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.153.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.153.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.153.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.153.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.154.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.154.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.154.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.154.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.154.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.154.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.155.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.155.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.155.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.155.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.155.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.155.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.156.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.156.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.156.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.156.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.156.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.156.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.157.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.157.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.157.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.157.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.157.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.157.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.158.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.158.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.158.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.158.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.158.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.158.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.159.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.159.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.159.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.159.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.159.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.159.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.160.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.160.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.160.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.160.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.160.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.160.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.161.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.161.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.161.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.161.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.161.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.161.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.162.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.162.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.162.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.162.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.162.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.162.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.163.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.163.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.163.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.163.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.163.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.163.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.164.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.164.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.164.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.164.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.164.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.164.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.165.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.165.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.165.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.165.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.165.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.165.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.166.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.166.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.166.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.166.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.166.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.166.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.167.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.167.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.167.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.167.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.167.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.167.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.168.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.168.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.168.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.168.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.168.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.168.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.169.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.169.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.169.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.169.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.169.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.169.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.170.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.170.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.170.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.170.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.170.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.170.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.171.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.171.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.171.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.171.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.171.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.171.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.172.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.172.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.172.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.172.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.172.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.172.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.173.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.173.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.173.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.173.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.173.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.173.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.174.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.174.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.174.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.174.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.174.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.174.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.175.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.175.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.175.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.175.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.175.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.175.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.176.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.176.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.176.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.176.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.176.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.176.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.177.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.177.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.177.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.177.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.177.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.177.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.178.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.178.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.178.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.178.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.178.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.178.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.179.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.179.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.179.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.179.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.179.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.179.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.180.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.180.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.180.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.180.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.180.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.180.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.181.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.181.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.181.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.181.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.181.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.181.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.182.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.182.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.182.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.182.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.182.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.182.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.183.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.183.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.183.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.183.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.183.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.183.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.184.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.184.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.184.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.184.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.184.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.184.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.185.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.185.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.185.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.185.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.185.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.185.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.186.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.186.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.186.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.186.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.186.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.186.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.187.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.187.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.187.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.187.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.187.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.187.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.188.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.188.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.188.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.188.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.188.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.188.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.189.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.189.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.189.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.189.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.189.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.189.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.190.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.190.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.190.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.190.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.190.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.190.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.191.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.191.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.191.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.191.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.191.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.191.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.192.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.192.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.192.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.192.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.192.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.192.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.193.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.193.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.193.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.193.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.193.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.193.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.194.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.194.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.194.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.194.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.194.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.194.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.195.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.195.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.195.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.195.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.195.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.195.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.196.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.196.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.196.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.196.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.196.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.196.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.197.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.197.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.197.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.197.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.197.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.197.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.198.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.198.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.198.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.198.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.198.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.198.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.199.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.199.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.199.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.199.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.199.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.199.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.200.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.200.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.200.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.200.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.200.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.200.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.201.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.201.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.201.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.201.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.201.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.201.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.202.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.202.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.202.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.202.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.202.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.202.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.203.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.203.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.203.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.203.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.203.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.203.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.204.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.204.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.204.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.204.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.204.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.204.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.205.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.205.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.205.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.205.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.205.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.205.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.206.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.206.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.206.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.206.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.206.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.206.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.207.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.207.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.207.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.207.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.207.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.207.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.208.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.208.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.208.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.208.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.208.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.208.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.209.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.209.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.209.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.209.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.209.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.209.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.210.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.210.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.210.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.210.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.210.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.210.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.211.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.211.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.211.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.211.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.211.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.211.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.212.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.212.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.212.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.212.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.212.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.212.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.213.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.213.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.213.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.213.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.213.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.213.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.214.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.214.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.214.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.214.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.214.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.214.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.215.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.215.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.215.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.215.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.215.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.215.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.216.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.216.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.216.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.216.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.216.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.216.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.217.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.217.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.217.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.217.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.217.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.217.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.218.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.218.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.218.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.218.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.218.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.218.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.219.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.219.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.219.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.219.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.219.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.219.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.220.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.220.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.220.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.220.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.220.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.220.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.221.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.221.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.221.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.221.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.221.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.221.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.222.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.222.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.222.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.222.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.222.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.222.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.223.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.223.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.223.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.223.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.223.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.223.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.224.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.224.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.224.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.224.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.224.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.224.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.225.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.225.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.225.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.225.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.225.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.225.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.226.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.226.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.226.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.226.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.226.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.226.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.227.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.227.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.227.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.227.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.227.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.227.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.228.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.228.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.228.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.228.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.228.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.228.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.229.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.229.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.229.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.229.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.229.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.229.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.230.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.230.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.230.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.230.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.230.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.230.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.231.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.231.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.231.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.231.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.231.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.231.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.232.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.232.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.232.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.232.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.232.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.232.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.233.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.233.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.233.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.233.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.233.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.233.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.234.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.234.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.234.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.234.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.234.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.234.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.235.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.235.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.235.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.235.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.235.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.235.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.236.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.236.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.236.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.236.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.236.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.236.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.237.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.237.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.237.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.237.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.237.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.237.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.238.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.238.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.238.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.238.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.238.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.238.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.239.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.239.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.239.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.239.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.239.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.239.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.240.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.240.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.240.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.240.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.240.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.240.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.241.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.241.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.241.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.241.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.241.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.241.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.242.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.242.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.242.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.242.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.242.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.242.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.243.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.243.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.243.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.243.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.243.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.243.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.244.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.244.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.244.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.244.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.244.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.244.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.245.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.245.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.245.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.245.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.245.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.245.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.246.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.246.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.246.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.246.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.246.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.246.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.247.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.247.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.247.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.247.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.247.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.247.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.248.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.248.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.248.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.248.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.248.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.248.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.249.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.249.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.249.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.249.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.249.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.249.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.250.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.250.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.250.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.250.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.250.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.250.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.251.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.251.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.251.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.251.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.251.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.251.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.252.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.252.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.252.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.252.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.252.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.252.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.253.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.253.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.253.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.253.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.253.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.253.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.254.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.254.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.254.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.254.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.254.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.254.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.255.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.255.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.255.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.255.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.255.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.255.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.input_layernorm.weight": "model-00100-of-000163.safetensors", "model.layers.38.post_attention_layernorm.weight": "model-00100-of-000163.safetensors", "model.layers.39.self_attn.q_a_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.self_attn.q_a_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.self_attn.q_a_layernorm.weight": "model-00101-of-000163.safetensors", "model.layers.39.self_attn.q_b_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.self_attn.q_b_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.self_attn.kv_a_proj_with_mqa.weight": "model-00101-of-000163.safetensors", - "model.layers.39.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.self_attn.kv_a_layernorm.weight": "model-00101-of-000163.safetensors", "model.layers.39.self_attn.kv_b_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.self_attn.kv_b_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.self_attn.o_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.self_attn.o_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.gate.weight": "model-00101-of-000163.safetensors", "model.layers.39.mlp.gate.e_score_correction_bias": "model-00101-of-000163.safetensors", "model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.shared_experts.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.shared_experts.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.0.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.0.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.0.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.0.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.0.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.1.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.1.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.1.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.1.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.1.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.2.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.2.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.2.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.2.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.2.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.3.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.3.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.3.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.3.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.3.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.4.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.4.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.4.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.4.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.4.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.5.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.5.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.5.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.5.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.5.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.6.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.6.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.6.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.6.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.6.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.7.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.7.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.7.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.7.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.7.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.8.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.8.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.8.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.8.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.8.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.9.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.9.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.9.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.9.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.9.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.10.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.10.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.10.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.10.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.10.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.11.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.11.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.11.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.11.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.11.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.12.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.12.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.12.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.12.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.12.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.13.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.13.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.13.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.13.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.13.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.14.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.14.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.14.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.14.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.14.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.15.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.15.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.15.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.15.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.15.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.16.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.16.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.16.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.16.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.16.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.17.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.17.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.17.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.17.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.17.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.18.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.18.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.18.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.18.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.18.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.19.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.19.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.19.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.19.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.19.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.20.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.20.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.20.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.20.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.20.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.21.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.21.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.21.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.21.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.21.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.22.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.22.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.22.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.22.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.22.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.23.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.23.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.23.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.23.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.23.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.23.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.24.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.24.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.24.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.24.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.24.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.25.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.25.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.25.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.25.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.25.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.26.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.26.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.26.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.26.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.26.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.27.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.27.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.27.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.27.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.27.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.28.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.28.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.28.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.28.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.28.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.29.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.29.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.29.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.29.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.29.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.30.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.30.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.30.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.30.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.30.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.30.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.31.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.31.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.31.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.31.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.31.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.32.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.32.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.32.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.32.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.32.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.33.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.33.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.33.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.33.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.33.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.34.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.34.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.34.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.34.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.34.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.35.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.35.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.35.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.35.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.35.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.36.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.36.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.36.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.36.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.36.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.37.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.37.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.37.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.37.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.37.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.37.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.38.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.38.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.38.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.38.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.38.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.39.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.39.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.39.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.39.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.39.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.40.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.40.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.40.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.40.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.40.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.41.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.41.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.41.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.41.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.41.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.42.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.42.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.42.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.42.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.42.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.43.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.43.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.43.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.43.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.43.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.44.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.44.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.44.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.44.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.44.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.45.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.45.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.45.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.45.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.45.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.46.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.46.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.46.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.46.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.46.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.47.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.47.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.47.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.47.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.47.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.48.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.48.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.48.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.48.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.48.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.49.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.49.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.49.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.49.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.49.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.50.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.50.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.50.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.50.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.50.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.51.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.51.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.51.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.51.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.51.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.52.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.52.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.52.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.52.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.52.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.53.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.53.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.53.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.53.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.53.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.54.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.54.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.54.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.54.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.54.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.55.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.55.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.55.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.55.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.55.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.56.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.56.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.56.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.56.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.56.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.57.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.57.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.57.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.57.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.57.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.58.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.58.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.58.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.58.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.58.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.59.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.59.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.59.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.59.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.59.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.60.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.60.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.60.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.60.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.60.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.61.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.61.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.61.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.61.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.61.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.62.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.62.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.62.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.62.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.62.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.63.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.63.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.63.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.63.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.63.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.64.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.64.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.64.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.64.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.64.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.64.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.65.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.65.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.65.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.65.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.65.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.66.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.66.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.66.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.66.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.66.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.67.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.67.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.67.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.67.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.67.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.68.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.68.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.68.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.68.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.68.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.69.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.69.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.69.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.69.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.69.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.70.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.70.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.70.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.70.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.70.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.71.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.71.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.71.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.71.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.71.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.72.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.72.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.72.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.72.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.72.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.73.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.73.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.73.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.73.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.73.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.74.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.74.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.74.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.74.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.74.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.75.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.75.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.75.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.75.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.75.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.76.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.76.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.76.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.76.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.76.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.77.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.77.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.77.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.77.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.77.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.78.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.78.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.78.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.78.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.78.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.78.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.79.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.79.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.79.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.79.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.79.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.80.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.80.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.80.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.80.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.80.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.81.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.81.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.81.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.81.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.81.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.82.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.82.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.82.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.82.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.82.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.83.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.83.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.83.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.83.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.83.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.84.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.84.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.84.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.84.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.84.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.85.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.85.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.85.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.85.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.85.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.86.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.86.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.86.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.86.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.86.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.87.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.87.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.87.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.87.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.87.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.88.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.88.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.88.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.88.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.88.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.89.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.89.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.89.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.89.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.89.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.90.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.90.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.90.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.90.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.90.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.91.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.91.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.91.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.91.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.91.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.92.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.92.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.92.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.92.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.92.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.93.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.93.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.93.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.93.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.93.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.94.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.94.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.94.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.94.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.94.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.95.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.95.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.95.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.95.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.95.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.96.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.96.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.96.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.96.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.96.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.97.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.97.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.97.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.97.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.97.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.98.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.98.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.98.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.98.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.98.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.99.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.99.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.99.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.99.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.99.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.100.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.100.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.100.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.100.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.100.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.100.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.101.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.101.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.101.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.101.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.101.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.102.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.102.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.102.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.102.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.102.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.103.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.103.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.103.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.103.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.103.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.104.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.104.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.104.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.104.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.104.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.105.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.105.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.105.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.105.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.105.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.106.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.106.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.106.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.106.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.106.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.107.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.107.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.107.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.107.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.107.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.108.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.108.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.108.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.108.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.108.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.109.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.109.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.109.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.109.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.109.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.110.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.110.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.110.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.110.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.110.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.111.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.111.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.111.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.111.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.111.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.112.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.112.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.112.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.112.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.112.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.113.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.113.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.113.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.113.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.113.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.114.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.114.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.114.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.114.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.114.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.115.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.115.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.115.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.115.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.115.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.116.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.116.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.116.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.116.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.116.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.117.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.117.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.117.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.117.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.117.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.118.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.118.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.118.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.118.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.118.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.119.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.119.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.119.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.119.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.119.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.120.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.120.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.120.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.120.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.120.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.121.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.121.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.121.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.121.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.121.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.122.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.122.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.122.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.122.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.122.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.123.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.123.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.123.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.123.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.123.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.124.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.124.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.124.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.124.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.124.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.125.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.125.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.125.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.125.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.125.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.126.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.126.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.126.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.126.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.126.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.127.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.127.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.127.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.127.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.127.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.128.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.128.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.128.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.128.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.128.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.128.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.129.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.129.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.129.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.129.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.129.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.129.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.130.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.130.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.130.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.130.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.130.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.130.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.131.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.131.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.131.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.131.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.131.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.131.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.132.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.132.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.132.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.132.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.132.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.132.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.133.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.133.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.133.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.133.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.133.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.133.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.134.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.134.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.134.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.134.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.134.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.134.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.135.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.135.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.135.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.135.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.135.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.135.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.136.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.136.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.136.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.136.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.136.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.136.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.137.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.137.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.137.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.137.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.137.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.137.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.138.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.138.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.138.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.138.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.138.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.138.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.139.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.139.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.139.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.139.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.139.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.139.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.140.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.140.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.140.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.140.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.140.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.140.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.141.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.141.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.141.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.141.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.141.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.141.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.142.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.142.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.142.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.142.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.142.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.142.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.143.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.143.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.143.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.143.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.143.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.143.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.144.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.144.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.144.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.144.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.144.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.144.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.145.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.145.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.145.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.145.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.145.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.145.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.146.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.146.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.146.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.146.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.146.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.146.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.147.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.147.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.147.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.147.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.147.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.147.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.148.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.148.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.148.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.148.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.148.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.148.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.149.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.149.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.149.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.149.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.149.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.149.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.150.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.150.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.150.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.150.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.150.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.150.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.151.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.151.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.151.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.151.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.151.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.151.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.152.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.152.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.152.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.152.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.152.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.152.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.153.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.153.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.153.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.153.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.153.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.153.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.154.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.154.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.154.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.154.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.154.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.154.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.155.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.155.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.155.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.155.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.155.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.155.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.156.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.156.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.156.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.156.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.156.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.156.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.157.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.157.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.157.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.157.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.157.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.157.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.158.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.158.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.158.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.158.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.158.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.158.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.159.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.159.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.159.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.159.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.159.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.159.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.160.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.160.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.160.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.160.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.160.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.160.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.161.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.161.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.161.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.161.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.161.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.161.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.162.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.162.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.162.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.162.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.162.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.162.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.163.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.163.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.163.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.163.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.163.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.163.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.164.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.164.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.164.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.164.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.164.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.164.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.165.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.165.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.165.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.165.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.165.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.165.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.166.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.166.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.166.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.166.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.166.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.166.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.167.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.167.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.167.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.167.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.167.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.167.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.168.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.168.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.168.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.168.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.168.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.168.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.169.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.169.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.169.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.169.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.169.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.169.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.170.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.170.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.170.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.170.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.170.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.170.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.171.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.171.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.171.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.171.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.171.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.171.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.172.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.172.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.172.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.172.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.172.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.172.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.173.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.173.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.173.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.173.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.173.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.173.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.174.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.174.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.174.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.174.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.174.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.174.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.175.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.175.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.175.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.175.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.175.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.175.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.176.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.176.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.176.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.176.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.176.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.176.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.177.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.177.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.177.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.177.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.177.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.177.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.178.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.178.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.178.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.178.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.178.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.178.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.179.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.179.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.179.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.179.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.179.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.179.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.180.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.180.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.180.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.180.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.180.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.180.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.181.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.181.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.181.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.181.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.181.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.181.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.182.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.182.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.182.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.182.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.182.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.182.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.183.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.183.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.183.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.183.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.183.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.183.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.184.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.184.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.184.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.184.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.184.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.184.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.185.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.185.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.185.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.185.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.185.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.185.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.186.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.186.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.186.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.186.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.186.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.186.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.187.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.187.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.187.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.187.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.187.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.187.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.188.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.188.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.188.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.188.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.188.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.188.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.189.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.189.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.189.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.189.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.189.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.189.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.190.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.190.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.190.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.190.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.190.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.190.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.191.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.191.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.191.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.191.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.191.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.191.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.192.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.192.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.192.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.192.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.192.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.192.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.193.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.193.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.193.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.193.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.193.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.193.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.194.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.194.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.194.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.194.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.194.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.194.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.195.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.195.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.195.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.195.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.195.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.195.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.196.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.196.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.196.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.196.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.196.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.196.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.197.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.197.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.197.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.197.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.197.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.197.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.198.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.198.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.198.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.198.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.198.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.198.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.199.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.199.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.199.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.199.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.199.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.199.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.200.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.200.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.200.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.200.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.200.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.200.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.201.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.201.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.201.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.201.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.201.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.201.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.202.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.202.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.202.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.202.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.202.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.202.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.203.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.203.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.203.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.203.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.203.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.203.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.204.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.204.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.204.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.204.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.204.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.204.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.205.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.205.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.205.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.205.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.205.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.205.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.206.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.206.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.206.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.206.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.206.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.206.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.207.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.207.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.207.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.207.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.207.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.207.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.208.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.208.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.208.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.208.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.208.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.208.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.209.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.209.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.209.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.209.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.209.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.209.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.210.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.210.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.210.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.210.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.210.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.210.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.211.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.211.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.211.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.211.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.211.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.211.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.212.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.212.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.212.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.212.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.212.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.212.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.213.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.213.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.213.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.213.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.213.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.213.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.214.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.214.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.214.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.214.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.214.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.214.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.215.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.215.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.215.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.215.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.215.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.215.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.216.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.216.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.216.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.216.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.216.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.216.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.217.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.217.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.217.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.217.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.217.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.217.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.218.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.218.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.218.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.218.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.218.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.218.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.219.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.219.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.219.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.219.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.219.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.219.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.220.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.220.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.220.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.220.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.220.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.220.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.221.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.221.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.221.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.221.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.221.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.221.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.222.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.222.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.222.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.222.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.222.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.222.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.223.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.223.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.223.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.223.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.223.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.223.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.224.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.224.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.224.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.224.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.224.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.224.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.225.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.225.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.225.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.225.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.225.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.225.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.226.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.226.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.226.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.226.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.226.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.226.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.227.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.227.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.227.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.227.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.227.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.227.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.228.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.228.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.228.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.228.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.228.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.228.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.229.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.229.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.229.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.229.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.229.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.229.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.230.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.230.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.230.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.230.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.230.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.230.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.231.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.231.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.231.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.231.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.231.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.231.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.232.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.232.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.232.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.232.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.232.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.232.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.233.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.233.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.233.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.233.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.233.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.233.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.234.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.234.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.234.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.234.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.234.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.234.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.235.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.235.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.235.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.235.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.235.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.235.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.236.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.236.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.236.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.236.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.236.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.236.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.237.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.237.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.237.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.237.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.237.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.237.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.238.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.238.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.238.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.238.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.238.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.238.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.239.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.239.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.239.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.239.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.239.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.239.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.240.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.240.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.240.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.240.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.240.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.240.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.241.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.241.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.241.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.241.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.241.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.241.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.242.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.242.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.242.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.242.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.242.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.242.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.243.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.243.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.243.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.243.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.243.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.243.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.244.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.244.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.244.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.244.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.244.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.244.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.245.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.245.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.245.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.245.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.245.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.245.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.246.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.246.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.246.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.246.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.246.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.246.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.247.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.247.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.247.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.247.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.247.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.247.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.248.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.248.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.248.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.248.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.248.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.248.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.249.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.249.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.249.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.249.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.249.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.249.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.250.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.250.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.250.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.250.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.250.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.250.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.251.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.251.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.251.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.251.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.251.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.251.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.252.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.252.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.252.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.252.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.252.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.252.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.253.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.253.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.253.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.253.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.253.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.253.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.254.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.254.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.254.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.254.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.254.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.254.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.255.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.255.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.255.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.255.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.255.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.255.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.input_layernorm.weight": "model-00103-of-000163.safetensors", "model.layers.39.post_attention_layernorm.weight": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.q_a_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.self_attn.q_a_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.q_a_layernorm.weight": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.q_b_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.self_attn.q_b_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.kv_a_proj_with_mqa.weight": "model-00103-of-000163.safetensors", - "model.layers.40.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.kv_a_layernorm.weight": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.kv_b_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.self_attn.kv_b_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.o_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.self_attn.o_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.gate.weight": "model-00103-of-000163.safetensors", "model.layers.40.mlp.gate.e_score_correction_bias": "model-00103-of-000163.safetensors", "model.layers.40.mlp.shared_experts.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.shared_experts.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.shared_experts.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.0.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.0.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.0.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.0.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.0.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.1.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.1.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.1.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.1.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.1.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.2.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.2.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.2.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.2.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.2.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.3.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.3.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.3.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.3.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.3.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.4.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.4.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.4.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.4.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.4.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.5.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.5.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.5.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.5.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.5.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.6.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.6.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.6.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.6.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.6.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.7.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.7.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.7.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.7.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.7.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.8.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.8.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.8.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.8.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.8.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.9.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.9.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.9.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.9.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.9.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.10.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.10.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.10.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.10.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.10.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.11.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.11.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.11.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.11.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.11.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.12.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.12.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.12.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.12.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.12.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.13.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.13.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.13.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.13.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.13.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.14.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.14.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.14.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.14.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.14.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.15.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.15.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.15.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.15.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.15.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.16.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.16.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.16.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.16.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.16.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.17.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.17.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.17.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.17.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.17.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.18.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.18.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.18.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.18.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.18.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.19.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.19.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.19.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.19.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.19.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.20.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.20.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.20.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.20.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.20.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.21.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.21.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.21.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.21.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.21.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.22.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.22.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.22.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.22.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.22.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.23.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.23.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.23.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.23.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.23.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.24.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.24.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.24.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.24.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.24.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.25.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.25.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.25.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.25.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.25.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.26.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.26.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.26.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.26.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.26.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.27.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.27.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.27.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.27.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.27.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.28.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.28.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.28.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.28.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.28.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.29.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.29.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.29.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.29.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.29.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.30.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.30.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.30.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.30.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.30.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.31.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.31.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.31.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.31.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.31.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.32.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.32.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.32.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.32.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.32.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.33.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.33.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.33.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.33.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.33.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.34.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.34.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.34.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.34.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.34.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.35.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.35.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.35.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.35.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.35.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.36.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.36.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.36.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.36.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.36.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.37.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.37.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.37.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.37.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.37.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.38.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.38.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.38.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.38.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.38.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.39.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.39.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.39.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.39.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.39.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.40.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.40.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.40.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.40.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.40.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.41.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.41.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.41.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.41.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.41.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.42.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.42.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.42.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.42.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.42.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.43.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.43.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.43.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.43.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.43.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.44.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.44.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.44.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.44.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.44.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.45.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.45.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.45.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.45.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.45.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.46.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.46.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.46.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.46.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.46.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.47.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.47.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.47.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.47.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.47.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.48.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.48.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.48.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.48.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.48.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.49.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.49.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.49.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.49.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.49.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.50.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.50.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.50.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.50.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.50.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.51.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.51.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.51.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.51.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.51.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.52.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.52.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.52.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.52.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.52.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.53.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.53.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.53.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.53.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.53.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.54.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.54.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.54.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.54.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.54.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.55.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.55.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.55.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.55.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.55.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.56.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.56.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.56.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.56.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.56.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.57.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.57.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.57.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.57.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.57.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.58.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.58.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.58.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.58.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.58.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.59.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.59.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.59.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.59.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.59.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.60.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.60.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.60.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.60.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.60.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.61.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.61.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.61.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.61.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.61.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.62.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.62.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.62.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.62.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.62.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.63.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.63.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.63.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.63.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.63.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.64.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.64.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.64.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.64.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.64.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.65.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.65.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.65.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.65.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.65.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.66.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.66.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.66.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.66.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.66.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.67.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.67.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.67.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.67.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.67.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.68.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.68.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.68.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.68.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.68.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.69.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.69.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.69.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.69.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.69.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.70.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.70.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.70.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.70.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.70.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.71.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.71.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.71.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.71.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.71.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.72.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.72.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.72.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.72.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.72.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.73.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.73.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.73.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.73.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.73.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.74.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.74.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.74.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.74.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.74.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.75.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.75.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.75.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.75.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.75.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.76.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.76.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.76.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.76.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.76.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.77.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.77.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.77.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.77.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.77.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.78.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.78.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.78.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.78.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.78.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.79.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.79.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.79.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.79.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.79.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.80.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.80.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.80.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.80.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.80.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.81.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.81.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.81.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.81.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.81.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.82.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.82.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.82.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.82.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.82.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.83.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.83.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.83.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.83.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.83.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.84.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.84.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.84.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.84.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.84.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.85.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.85.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.85.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.85.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.85.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.86.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.86.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.86.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.86.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.86.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.87.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.87.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.87.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.87.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.87.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.88.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.88.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.88.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.88.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.88.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.89.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.89.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.89.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.89.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.89.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.90.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.90.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.90.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.90.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.90.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.91.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.91.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.91.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.91.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.91.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.92.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.92.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.92.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.92.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.92.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.93.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.93.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.93.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.93.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.93.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.94.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.94.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.94.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.94.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.94.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.95.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.95.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.95.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.95.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.95.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.96.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.96.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.96.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.96.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.96.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.97.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.97.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.97.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.97.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.97.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.98.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.98.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.98.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.98.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.98.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.99.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.99.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.99.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.99.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.99.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.100.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.100.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.100.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.100.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.100.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.101.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.101.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.101.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.101.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.101.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.102.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.102.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.102.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.102.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.102.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.103.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.103.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.103.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.103.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.103.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.104.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.104.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.104.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.104.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.104.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.105.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.105.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.105.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.105.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.105.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.106.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.106.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.106.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.106.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.106.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.107.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.107.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.107.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.107.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.107.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.108.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.108.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.108.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.108.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.108.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.109.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.109.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.109.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.109.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.109.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.110.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.110.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.110.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.110.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.110.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.111.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.111.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.111.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.111.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.111.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.112.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.112.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.112.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.112.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.112.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.113.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.113.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.113.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.113.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.113.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.114.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.114.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.114.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.114.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.114.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.115.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.115.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.115.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.115.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.115.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.116.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.116.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.116.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.116.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.116.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.117.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.117.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.117.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.117.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.117.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.118.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.118.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.118.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.118.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.118.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.119.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.119.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.119.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.119.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.119.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.120.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.120.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.120.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.120.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.120.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.121.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.121.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.121.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.121.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.121.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.122.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.122.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.122.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.122.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.122.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.123.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.123.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.123.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.123.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.123.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.124.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.124.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.124.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.124.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.124.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.125.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.125.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.125.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.125.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.125.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.126.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.126.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.126.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.126.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.126.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.127.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.127.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.127.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.127.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.127.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.128.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.128.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.128.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.128.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.128.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.128.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.129.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.129.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.129.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.129.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.129.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.129.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.130.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.130.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.130.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.130.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.130.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.130.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.131.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.131.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.131.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.131.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.131.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.131.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.132.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.132.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.132.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.132.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.132.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.132.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.133.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.133.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.133.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.133.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.133.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.133.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.134.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.134.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.134.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.134.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.134.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.134.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.135.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.135.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.135.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.135.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.135.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.135.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.136.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.136.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.136.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.136.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.136.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.136.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.137.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.137.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.137.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.137.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.137.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.137.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.138.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.138.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.138.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.138.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.138.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.138.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.139.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.139.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.139.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.139.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.139.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.139.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.140.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.140.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.140.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.140.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.140.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.140.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.141.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.141.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.141.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.141.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.141.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.141.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.142.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.142.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.142.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.142.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.142.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.142.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.143.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.143.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.143.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.143.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.143.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.143.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.144.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.144.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.144.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.144.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.144.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.144.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.145.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.145.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.145.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.145.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.145.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.145.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.146.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.146.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.146.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.146.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.146.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.146.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.147.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.147.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.147.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.147.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.147.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.147.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.148.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.148.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.148.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.148.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.148.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.148.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.149.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.149.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.149.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.149.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.149.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.149.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.150.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.150.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.150.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.150.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.150.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.150.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.151.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.151.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.151.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.151.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.151.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.151.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.152.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.152.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.152.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.152.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.152.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.152.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.153.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.153.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.153.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.153.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.153.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.153.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.154.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.154.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.154.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.154.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.154.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.154.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.155.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.155.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.155.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.155.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.155.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.155.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.156.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.156.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.156.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.156.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.156.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.156.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.157.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.157.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.157.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.157.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.157.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.157.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.158.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.158.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.158.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.158.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.158.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.158.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.159.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.159.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.159.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.159.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.159.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.159.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.160.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.160.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.160.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.160.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.160.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.160.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.161.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.161.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.161.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.161.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.161.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.161.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.162.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.162.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.162.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.162.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.162.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.162.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.163.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.163.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.163.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.163.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.163.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.163.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.164.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.164.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.164.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.164.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.164.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.164.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.165.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.165.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.165.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.165.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.165.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.165.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.166.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.166.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.166.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.166.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.166.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.166.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.167.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.167.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.167.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.167.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.167.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.167.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.168.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.168.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.168.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.168.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.168.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.168.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.169.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.169.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.169.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.169.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.169.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.169.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.170.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.170.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.170.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.170.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.170.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.170.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.171.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.171.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.171.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.171.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.171.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.171.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.172.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.172.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.172.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.172.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.172.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.172.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.173.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.173.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.173.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.173.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.173.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.173.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.174.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.174.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.174.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.174.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.174.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.174.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.175.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.175.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.175.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.175.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.175.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.175.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.176.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.176.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.176.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.176.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.176.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.176.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.177.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.177.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.177.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.177.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.177.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.177.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.178.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.178.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.178.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.178.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.178.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.178.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.179.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.179.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.179.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.179.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.179.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.179.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.180.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.180.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.180.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.180.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.180.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.180.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.181.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.181.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.181.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.181.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.181.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.181.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.182.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.182.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.182.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.182.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.182.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.182.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.183.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.183.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.183.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.183.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.183.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.183.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.184.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.184.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.184.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.184.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.184.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.184.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.185.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.185.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.185.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.185.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.185.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.185.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.186.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.186.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.186.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.186.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.186.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.186.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.187.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.187.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.187.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.187.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.187.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.187.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.188.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.188.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.188.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.188.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.188.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.188.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.189.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.189.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.189.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.189.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.189.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.189.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.190.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.190.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.190.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.190.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.190.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.190.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.191.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.191.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.191.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.191.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.191.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.191.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.192.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.192.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.192.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.192.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.192.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.192.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.193.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.193.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.193.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.193.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.193.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.193.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.194.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.194.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.194.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.194.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.194.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.194.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.195.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.195.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.195.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.195.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.195.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.195.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.196.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.196.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.196.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.196.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.196.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.196.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.197.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.197.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.197.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.197.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.197.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.197.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.198.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.198.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.198.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.198.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.198.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.198.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.199.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.199.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.199.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.199.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.199.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.199.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.200.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.200.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.200.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.200.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.200.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.200.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.201.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.201.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.201.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.201.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.201.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.201.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.202.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.202.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.202.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.202.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.202.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.202.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.203.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.203.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.203.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.203.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.203.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.203.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.204.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.204.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.204.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.204.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.204.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.204.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.205.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.205.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.205.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.205.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.205.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.205.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.206.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.206.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.206.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.206.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.206.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.206.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.207.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.207.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.207.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.207.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.207.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.207.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.208.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.208.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.208.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.208.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.208.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.208.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.209.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.209.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.209.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.209.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.209.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.209.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.210.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.210.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.210.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.210.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.210.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.210.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.211.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.211.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.211.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.211.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.211.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.211.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.212.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.212.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.212.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.212.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.212.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.212.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.213.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.213.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.213.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.213.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.213.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.213.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.214.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.214.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.214.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.214.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.214.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.214.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.215.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.215.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.215.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.215.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.215.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.215.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.216.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.216.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.216.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.216.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.216.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.216.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.217.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.217.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.217.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.217.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.217.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.217.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.218.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.218.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.218.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.218.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.218.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.218.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.219.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.219.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.219.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.219.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.219.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.219.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.220.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.220.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.220.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.220.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.220.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.220.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.221.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.221.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.221.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.221.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.221.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.221.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.222.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.222.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.222.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.222.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.222.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.222.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.223.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.223.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.223.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.223.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.223.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.223.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.224.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.224.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.224.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.224.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.224.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.224.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.225.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.225.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.225.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.225.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.225.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.225.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.226.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.226.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.226.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.226.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.226.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.226.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.227.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.227.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.227.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.227.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.227.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.227.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.228.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.228.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.228.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.228.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.228.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.228.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.229.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.229.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.229.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.229.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.229.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.229.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.230.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.230.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.230.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.230.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.230.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.230.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.231.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.231.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.231.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.231.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.231.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.231.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.232.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.232.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.232.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.232.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.232.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.232.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.233.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.233.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.233.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.233.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.233.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.233.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.234.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.234.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.234.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.234.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.234.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.234.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.235.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.235.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.235.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.235.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.235.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.235.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.236.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.236.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.236.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.236.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.236.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.236.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.237.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.237.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.237.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.237.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.237.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.237.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.238.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.238.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.238.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.238.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.238.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.238.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.239.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.239.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.239.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.239.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.239.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.239.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.240.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.240.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.240.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.240.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.240.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.240.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.241.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.241.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.241.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.241.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.241.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.241.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.242.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.242.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.242.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.242.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.242.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.242.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.243.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.243.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.243.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.243.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.243.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.243.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.244.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.244.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.244.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.244.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.244.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.244.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.245.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.245.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.245.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.245.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.245.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.245.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.246.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.246.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.246.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.246.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.246.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.246.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.247.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.247.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.247.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.247.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.247.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.247.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.248.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.248.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.248.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.248.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.248.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.248.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.249.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.249.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.249.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.249.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.249.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.249.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.250.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.250.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.250.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.250.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.250.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.250.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.251.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.251.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.251.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.251.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.251.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.251.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.252.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.252.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.252.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.252.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.252.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.252.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.253.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.253.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.253.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.253.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.253.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.253.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.254.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.254.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.254.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.254.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.254.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.254.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.255.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.255.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.255.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.255.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.255.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.255.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.input_layernorm.weight": "model-00106-of-000163.safetensors", "model.layers.40.post_attention_layernorm.weight": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.q_a_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.self_attn.q_a_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.q_a_layernorm.weight": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.q_b_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.self_attn.q_b_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.kv_a_proj_with_mqa.weight": "model-00106-of-000163.safetensors", - "model.layers.41.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.kv_a_layernorm.weight": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.kv_b_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.self_attn.kv_b_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.o_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.self_attn.o_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.gate.weight": "model-00106-of-000163.safetensors", "model.layers.41.mlp.gate.e_score_correction_bias": "model-00106-of-000163.safetensors", "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.shared_experts.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.shared_experts.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.shared_experts.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.0.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.0.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.0.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.0.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.0.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.1.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.1.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.1.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.1.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.1.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.2.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.2.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.2.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.2.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.2.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.3.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.3.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.3.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.3.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.3.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.4.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.4.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.4.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.4.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.4.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.5.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.5.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.5.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.5.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.5.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.6.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.6.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.6.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.6.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.6.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.7.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.7.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.7.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.7.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.7.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.8.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.8.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.8.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.8.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.8.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.9.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.9.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.9.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.9.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.9.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.10.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.10.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.10.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.10.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.10.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.11.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.11.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.11.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.11.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.11.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.12.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.12.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.12.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.12.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.12.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.13.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.13.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.13.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.13.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.13.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.14.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.14.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.14.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.14.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.14.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.15.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.15.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.15.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.15.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.15.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.16.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.16.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.16.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.16.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.16.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.17.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.17.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.17.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.17.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.17.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.18.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.18.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.18.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.18.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.18.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.19.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.19.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.19.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.19.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.19.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.20.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.20.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.20.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.20.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.20.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.21.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.21.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.21.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.21.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.21.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.22.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.22.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.22.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.22.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.22.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.23.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.23.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.23.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.23.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.23.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.24.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.24.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.24.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.24.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.24.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.25.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.25.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.25.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.25.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.25.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.26.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.26.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.26.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.26.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.26.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.27.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.27.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.27.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.27.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.27.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.28.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.28.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.28.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.28.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.28.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.29.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.29.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.29.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.29.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.29.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.30.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.30.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.30.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.30.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.30.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.31.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.31.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.31.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.31.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.31.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.32.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.32.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.32.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.32.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.32.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.33.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.33.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.33.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.33.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.33.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.34.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.34.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.34.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.34.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.34.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.35.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.35.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.35.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.35.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.35.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.36.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.36.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.36.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.36.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.36.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.37.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.37.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.37.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.37.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.37.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.38.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.38.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.38.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.38.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.38.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.39.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.39.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.39.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.39.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.39.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.40.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.40.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.40.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.40.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.40.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.41.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.41.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.41.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.41.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.41.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.42.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.42.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.42.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.42.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.42.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.43.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.43.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.43.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.43.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.43.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.44.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.44.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.44.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.44.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.44.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.45.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.45.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.45.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.45.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.45.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.46.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.46.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.46.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.46.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.46.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.47.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.47.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.47.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.47.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.47.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.48.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.48.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.48.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.48.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.48.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.49.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.49.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.49.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.49.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.49.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.50.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.50.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.50.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.50.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.50.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.51.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.51.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.51.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.51.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.51.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.52.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.52.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.52.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.52.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.52.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.53.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.53.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.53.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.53.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.53.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.54.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.54.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.54.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.54.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.54.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.55.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.55.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.55.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.55.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.55.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.56.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.56.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.56.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.56.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.56.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.57.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.57.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.57.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.57.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.57.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.58.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.58.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.58.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.58.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.58.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.59.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.59.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.59.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.59.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.59.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.60.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.60.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.60.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.60.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.60.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.61.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.61.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.61.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.61.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.61.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.62.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.62.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.62.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.62.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.62.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.63.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.63.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.63.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.63.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.63.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.64.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.64.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.64.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.64.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.64.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.65.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.65.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.65.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.65.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.65.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.66.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.66.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.66.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.66.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.66.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.67.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.67.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.67.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.67.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.67.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.68.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.68.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.68.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.68.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.68.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.69.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.69.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.69.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.69.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.69.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.70.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.70.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.70.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.70.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.70.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.71.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.71.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.71.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.71.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.71.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.72.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.72.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.72.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.72.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.72.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.73.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.73.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.73.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.73.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.73.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.74.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.74.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.74.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.74.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.74.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.75.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.75.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.75.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.75.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.75.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.76.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.76.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.76.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.76.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.76.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.77.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.77.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.77.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.77.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.77.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.78.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.78.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.78.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.78.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.78.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.79.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.79.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.79.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.79.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.79.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.80.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.80.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.80.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.80.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.80.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.81.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.81.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.81.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.81.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.81.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.82.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.82.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.82.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.82.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.82.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.83.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.83.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.83.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.83.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.83.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.84.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.84.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.84.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.84.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.84.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.85.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.85.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.85.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.85.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.85.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.86.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.86.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.86.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.86.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.86.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.87.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.87.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.87.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.87.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.87.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.88.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.88.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.88.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.88.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.88.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.89.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.89.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.89.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.89.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.89.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.90.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.90.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.90.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.90.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.90.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.91.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.91.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.91.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.91.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.91.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.92.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.92.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.92.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.92.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.92.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.93.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.93.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.93.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.93.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.93.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.94.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.94.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.94.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.94.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.94.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.95.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.95.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.95.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.95.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.95.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.96.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.96.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.96.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.96.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.96.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.97.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.97.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.97.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.97.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.97.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.98.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.98.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.98.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.98.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.98.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.99.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.99.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.99.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.99.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.99.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.100.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.100.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.100.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.100.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.100.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.101.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.101.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.101.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.101.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.101.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.102.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.102.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.102.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.102.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.102.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.103.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.103.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.103.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.103.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.103.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.104.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.104.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.104.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.104.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.104.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.105.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.105.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.105.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.105.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.105.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.106.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.106.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.106.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.106.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.106.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.107.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.107.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.107.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.107.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.107.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.107.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.108.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.108.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.108.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.108.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.108.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.109.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.109.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.109.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.109.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.109.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.110.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.110.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.110.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.110.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.110.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.111.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.111.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.111.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.111.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.111.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.112.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.112.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.112.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.112.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.112.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.113.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.113.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.113.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.113.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.113.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.114.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.114.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.114.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.114.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.114.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.115.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.115.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.115.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.115.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.115.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.116.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.116.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.116.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.116.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.116.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.117.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.117.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.117.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.117.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.117.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.118.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.118.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.118.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.118.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.118.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.119.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.119.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.119.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.119.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.119.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.120.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.120.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.120.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.120.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.120.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.121.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.121.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.121.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.121.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.121.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.122.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.122.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.122.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.122.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.122.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.123.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.123.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.123.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.123.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.123.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.124.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.124.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.124.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.124.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.124.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.125.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.125.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.125.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.125.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.125.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.126.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.126.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.126.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.126.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.126.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.127.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.127.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.127.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.127.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.127.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.128.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.128.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.128.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.128.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.128.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.128.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.129.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.129.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.129.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.129.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.129.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.129.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.130.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.130.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.130.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.130.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.130.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.130.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.131.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.131.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.131.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.131.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.131.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.131.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.132.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.132.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.132.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.132.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.132.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.132.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.133.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.133.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.133.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.133.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.133.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.133.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.134.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.134.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.134.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.134.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.134.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.134.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.135.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.135.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.135.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.135.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.135.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.135.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.136.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.136.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.136.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.136.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.136.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.136.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.137.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.137.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.137.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.137.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.137.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.137.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.138.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.138.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.138.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.138.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.138.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.138.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.139.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.139.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.139.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.139.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.139.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.139.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.140.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.140.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.140.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.140.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.140.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.140.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.141.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.141.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.141.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.141.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.141.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.141.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.142.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.142.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.142.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.142.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.142.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.142.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.143.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.143.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.143.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.143.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.143.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.143.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.144.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.144.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.144.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.144.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.144.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.144.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.145.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.145.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.145.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.145.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.145.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.145.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.146.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.146.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.146.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.146.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.146.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.146.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.147.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.147.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.147.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.147.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.147.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.147.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.148.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.148.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.148.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.148.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.148.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.148.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.149.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.149.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.149.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.149.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.149.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.149.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.150.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.150.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.150.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.150.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.150.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.150.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.151.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.151.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.151.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.151.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.151.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.151.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.152.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.152.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.152.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.152.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.152.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.152.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.153.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.153.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.153.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.153.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.153.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.153.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.154.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.154.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.154.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.154.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.154.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.154.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.155.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.155.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.155.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.155.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.155.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.155.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.156.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.156.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.156.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.156.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.156.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.156.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.157.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.157.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.157.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.157.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.157.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.157.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.158.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.158.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.158.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.158.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.158.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.158.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.159.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.159.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.159.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.159.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.159.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.159.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.160.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.160.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.160.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.160.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.160.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.160.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.161.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.161.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.161.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.161.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.161.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.161.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.162.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.162.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.162.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.162.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.162.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.162.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.163.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.163.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.163.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.163.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.163.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.163.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.164.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.164.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.164.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.164.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.164.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.164.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.165.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.165.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.165.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.165.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.165.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.165.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.166.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.166.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.166.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.166.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.166.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.166.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.167.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.167.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.167.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.167.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.167.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.167.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.168.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.168.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.168.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.168.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.168.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.168.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.169.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.169.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.169.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.169.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.169.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.169.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.170.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.170.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.170.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.170.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.170.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.170.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.171.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.171.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.171.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.171.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.171.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.171.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.172.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.172.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.172.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.172.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.172.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.172.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.173.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.173.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.173.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.173.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.173.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.173.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.174.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.174.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.174.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.174.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.174.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.174.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.175.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.175.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.175.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.175.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.175.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.175.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.176.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.176.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.176.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.176.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.176.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.176.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.177.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.177.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.177.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.177.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.177.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.177.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.178.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.178.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.178.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.178.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.178.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.178.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.179.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.179.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.179.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.179.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.179.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.179.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.180.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.180.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.180.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.180.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.180.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.180.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.181.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.181.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.181.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.181.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.181.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.181.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.182.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.182.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.182.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.182.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.182.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.182.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.183.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.183.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.183.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.183.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.183.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.183.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.184.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.184.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.184.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.184.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.184.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.184.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.185.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.185.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.185.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.185.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.185.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.185.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.186.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.186.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.186.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.186.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.186.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.186.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.187.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.187.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.187.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.187.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.187.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.187.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.188.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.188.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.188.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.188.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.188.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.188.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.189.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.189.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.189.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.189.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.189.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.189.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.190.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.190.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.190.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.190.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.190.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.190.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.191.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.191.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.191.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.191.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.191.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.191.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.192.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.192.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.192.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.192.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.192.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.192.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.193.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.193.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.193.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.193.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.193.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.193.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.194.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.194.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.194.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.194.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.194.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.194.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.195.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.195.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.195.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.195.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.195.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.195.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.196.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.196.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.196.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.196.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.196.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.196.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.197.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.197.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.197.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.197.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.197.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.197.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.198.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.198.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.198.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.198.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.198.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.198.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.199.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.199.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.199.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.199.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.199.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.199.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.200.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.200.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.200.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.200.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.200.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.200.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.201.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.201.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.201.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.201.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.201.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.201.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.202.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.202.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.202.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.202.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.202.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.202.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.203.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.203.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.203.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.203.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.203.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.203.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.204.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.204.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.204.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.204.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.204.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.204.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.205.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.205.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.205.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.205.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.205.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.205.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.206.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.206.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.206.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.206.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.206.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.206.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.207.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.207.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.207.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.207.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.207.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.207.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.208.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.208.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.208.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.208.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.208.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.208.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.209.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.209.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.209.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.209.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.209.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.209.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.210.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.210.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.210.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.210.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.210.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.210.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.211.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.211.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.211.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.211.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.211.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.211.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.212.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.212.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.212.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.212.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.212.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.212.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.213.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.213.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.213.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.213.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.213.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.213.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.214.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.214.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.214.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.214.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.214.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.214.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.215.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.215.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.215.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.215.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.215.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.215.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.216.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.216.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.216.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.216.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.216.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.216.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.217.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.217.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.217.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.217.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.217.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.217.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.218.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.218.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.218.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.218.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.218.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.218.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.219.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.219.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.219.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.219.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.219.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.219.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.220.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.220.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.220.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.220.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.220.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.220.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.221.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.221.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.221.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.221.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.221.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.221.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.222.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.222.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.222.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.222.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.222.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.222.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.223.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.223.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.223.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.223.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.223.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.223.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.224.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.224.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.224.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.224.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.224.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.224.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.225.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.225.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.225.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.225.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.225.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.225.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.226.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.226.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.226.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.226.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.226.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.226.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.227.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.227.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.227.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.227.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.227.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.227.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.228.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.228.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.228.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.228.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.228.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.228.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.229.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.229.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.229.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.229.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.229.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.229.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.230.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.230.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.230.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.230.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.230.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.230.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.231.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.231.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.231.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.231.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.231.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.231.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.232.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.232.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.232.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.232.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.232.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.232.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.233.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.233.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.233.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.233.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.233.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.233.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.234.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.234.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.234.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.234.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.234.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.234.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.235.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.235.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.235.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.235.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.235.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.235.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.236.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.236.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.236.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.236.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.236.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.236.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.237.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.237.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.237.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.237.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.237.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.237.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.238.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.238.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.238.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.238.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.238.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.238.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.239.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.239.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.239.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.239.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.239.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.239.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.240.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.240.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.240.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.240.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.240.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.240.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.241.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.241.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.241.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.241.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.241.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.241.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.242.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.242.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.242.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.242.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.242.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.242.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.243.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.243.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.243.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.243.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.243.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.243.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.244.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.244.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.244.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.244.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.244.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.244.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.245.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.245.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.245.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.245.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.245.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.245.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.246.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.246.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.246.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.246.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.246.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.246.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.247.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.247.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.247.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.247.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.247.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.247.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.248.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.248.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.248.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.248.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.248.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.248.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.249.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.249.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.249.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.249.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.249.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.249.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.250.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.250.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.250.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.250.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.250.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.250.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.251.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.251.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.251.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.251.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.251.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.251.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.252.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.252.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.252.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.252.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.252.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.252.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.253.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.253.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.253.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.253.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.253.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.253.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.254.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.254.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.254.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.254.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.254.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.254.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.255.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.255.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.255.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.255.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.255.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.255.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.input_layernorm.weight": "model-00109-of-000163.safetensors", "model.layers.41.post_attention_layernorm.weight": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.q_a_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.self_attn.q_a_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.q_a_layernorm.weight": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.q_b_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.self_attn.q_b_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.kv_a_proj_with_mqa.weight": "model-00109-of-000163.safetensors", - "model.layers.42.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.kv_a_layernorm.weight": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.kv_b_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.self_attn.kv_b_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.o_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.self_attn.o_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.gate.weight": "model-00109-of-000163.safetensors", "model.layers.42.mlp.gate.e_score_correction_bias": "model-00109-of-000163.safetensors", "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.shared_experts.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.shared_experts.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.0.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.0.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.0.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.0.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.0.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.1.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.1.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.1.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.1.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.1.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.2.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.2.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.2.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.2.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.2.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.3.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.3.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.3.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.3.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.3.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.4.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.4.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.4.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.4.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.4.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.5.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.5.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.5.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.5.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.5.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.6.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.6.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.6.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.6.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.6.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.7.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.7.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.7.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.7.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.7.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.8.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.8.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.8.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.8.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.8.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.9.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.9.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.9.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.9.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.9.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.10.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.10.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.10.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.10.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.10.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.11.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.11.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.11.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.11.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.11.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.12.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.12.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.12.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.12.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.12.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.13.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.13.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.13.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.13.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.13.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.14.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.14.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.14.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.14.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.14.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.15.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.15.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.15.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.15.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.15.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.16.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.16.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.16.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.16.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.16.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.17.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.17.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.17.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.17.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.17.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.18.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.18.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.18.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.18.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.18.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.19.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.19.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.19.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.19.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.19.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.20.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.20.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.20.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.20.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.20.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.21.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.21.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.21.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.21.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.21.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.22.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.22.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.22.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.22.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.22.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.23.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.23.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.23.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.23.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.23.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.24.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.24.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.24.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.24.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.24.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.25.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.25.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.25.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.25.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.25.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.26.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.26.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.26.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.26.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.26.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.27.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.27.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.27.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.27.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.27.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.28.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.28.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.28.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.28.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.28.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.29.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.29.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.29.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.29.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.29.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.30.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.30.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.30.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.30.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.30.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.31.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.31.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.31.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.31.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.31.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.32.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.32.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.32.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.32.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.32.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.33.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.33.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.33.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.33.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.33.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.34.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.34.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.34.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.34.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.34.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.35.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.35.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.35.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.35.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.35.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.36.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.36.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.36.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.36.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.36.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.37.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.37.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.37.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.37.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.37.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.38.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.38.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.38.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.38.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.38.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.39.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.39.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.39.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.39.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.39.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.40.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.40.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.40.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.40.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.40.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.41.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.41.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.41.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.41.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.41.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.42.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.42.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.42.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.42.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.42.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.43.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.43.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.43.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.43.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.43.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.44.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.44.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.44.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.44.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.44.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.45.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.45.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.45.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.45.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.45.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.46.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.46.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.46.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.46.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.46.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.47.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.47.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.47.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.47.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.47.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.48.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.48.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.48.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.48.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.48.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.49.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.49.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.49.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.49.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.49.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.50.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.50.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.50.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.50.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.50.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.51.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.51.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.51.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.51.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.51.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.52.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.52.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.52.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.52.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.52.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.53.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.53.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.53.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.53.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.53.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.54.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.54.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.54.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.54.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.54.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.55.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.55.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.55.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.55.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.55.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.56.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.56.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.56.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.56.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.56.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.57.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.57.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.57.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.57.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.57.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.58.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.58.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.58.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.58.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.58.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.59.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.59.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.59.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.59.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.59.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.60.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.60.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.60.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.60.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.60.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.61.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.61.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.61.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.61.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.61.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.62.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.62.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.62.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.62.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.62.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.63.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.63.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.63.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.63.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.63.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.64.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.64.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.64.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.64.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.64.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.65.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.65.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.65.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.65.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.65.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.66.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.66.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.66.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.66.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.66.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.67.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.67.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.67.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.67.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.67.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.68.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.68.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.68.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.68.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.68.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.69.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.69.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.69.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.69.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.69.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.70.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.70.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.70.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.70.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.70.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.71.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.71.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.71.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.71.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.71.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.72.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.72.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.72.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.72.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.72.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.73.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.73.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.73.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.73.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.73.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.74.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.74.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.74.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.74.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.74.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.75.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.75.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.75.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.75.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.75.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.76.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.76.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.76.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.76.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.76.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.77.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.77.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.77.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.77.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.77.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.78.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.78.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.78.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.78.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.78.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.79.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.79.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.79.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.79.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.79.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.80.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.80.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.80.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.80.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.80.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.81.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.81.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.81.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.81.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.81.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.82.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.82.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.82.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.82.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.82.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.83.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.83.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.83.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.83.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.83.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.84.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.84.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.84.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.84.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.84.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.85.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.85.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.85.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.85.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.85.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.86.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.86.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.86.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.86.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.86.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.87.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.87.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.87.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.87.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.87.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.88.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.88.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.88.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.88.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.88.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.89.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.89.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.89.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.89.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.89.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.90.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.90.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.90.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.90.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.90.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.91.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.91.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.91.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.91.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.91.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.92.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.92.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.92.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.92.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.92.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.93.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.93.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.93.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.93.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.93.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.94.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.94.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.94.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.94.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.94.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.95.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.95.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.95.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.95.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.95.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.96.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.96.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.96.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.96.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.96.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.97.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.97.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.97.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.97.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.97.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.98.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.98.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.98.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.98.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.98.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.99.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.99.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.99.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.99.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.99.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.100.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.100.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.100.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.100.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.100.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.101.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.101.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.101.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.101.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.101.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.102.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.102.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.102.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.102.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.102.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.103.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.103.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.103.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.103.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.103.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.104.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.104.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.104.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.104.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.104.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.105.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.105.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.105.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.105.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.105.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.106.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.106.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.106.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.106.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.106.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.107.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.107.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.107.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.107.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.107.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.108.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.108.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.108.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.108.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.108.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.109.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.109.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.109.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.109.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.109.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.110.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.110.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.110.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.110.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.110.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.111.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.111.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.111.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.111.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.111.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.112.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.112.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.112.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.112.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.112.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.113.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.113.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.113.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.113.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.113.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.114.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.114.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.114.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.114.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.114.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.115.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.115.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.115.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.115.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.115.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.116.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.116.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.116.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.116.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.116.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.117.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.117.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.117.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.117.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.117.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.118.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.118.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.118.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.118.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.118.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.119.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.119.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.119.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.119.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.119.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.120.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.120.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.120.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.120.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.120.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.121.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.121.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.121.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.121.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.121.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.122.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.122.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.122.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.122.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.122.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.123.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.123.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.123.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.123.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.123.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.124.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.124.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.124.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.124.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.124.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.125.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.125.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.125.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.125.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.125.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.126.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.126.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.126.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.126.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.126.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.127.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.127.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.127.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.127.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.127.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.128.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.128.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.128.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.128.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.128.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.128.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.129.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.129.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.129.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.129.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.129.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.129.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.130.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.130.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.130.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.130.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.130.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.130.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.131.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.131.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.131.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.131.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.131.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.131.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.132.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.132.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.132.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.132.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.132.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.132.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.133.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.133.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.133.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.133.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.133.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.133.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.134.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.134.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.134.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.134.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.134.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.134.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.135.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.135.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.135.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.135.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.135.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.135.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.136.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.136.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.136.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.136.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.136.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.136.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.137.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.137.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.137.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.137.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.137.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.137.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.138.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.138.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.138.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.138.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.138.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.138.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.139.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.139.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.139.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.139.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.139.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.139.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.140.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.140.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.140.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.140.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.140.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.140.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.141.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.141.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.141.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.141.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.141.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.141.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.142.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.142.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.142.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.142.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.142.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.142.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.143.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.143.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.143.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.143.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.143.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.143.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.144.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.144.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.144.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.144.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.144.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.144.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.145.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.145.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.145.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.145.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.145.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.145.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.146.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.146.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.146.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.146.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.146.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.146.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.147.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.147.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.147.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.147.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.147.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.147.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.148.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.148.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.148.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.148.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.148.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.148.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.149.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.149.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.149.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.149.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.149.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.149.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.150.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.150.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.150.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.150.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.150.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.150.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.151.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.151.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.151.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.151.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.151.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.151.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.152.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.152.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.152.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.152.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.152.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.152.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.153.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.153.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.153.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.153.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.153.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.153.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.154.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.154.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.154.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.154.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.154.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.154.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.155.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.155.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.155.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.155.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.155.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.155.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.156.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.156.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.156.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.156.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.156.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.156.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.157.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.157.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.157.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.157.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.157.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.157.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.158.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.158.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.158.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.158.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.158.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.158.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.159.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.159.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.159.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.159.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.159.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.159.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.160.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.160.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.160.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.160.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.160.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.160.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.161.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.161.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.161.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.161.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.161.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.161.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.162.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.162.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.162.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.162.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.162.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.162.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.163.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.163.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.163.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.163.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.163.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.163.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.164.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.164.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.164.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.164.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.164.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.164.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.165.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.165.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.165.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.165.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.165.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.165.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.166.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.166.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.166.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.166.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.166.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.166.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.167.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.167.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.167.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.167.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.167.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.167.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.168.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.168.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.168.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.168.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.168.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.168.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.169.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.169.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.169.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.169.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.169.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.169.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.170.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.170.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.170.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.170.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.170.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.170.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.171.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.171.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.171.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.171.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.171.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.171.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.172.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.172.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.172.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.172.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.172.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.172.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.173.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.173.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.173.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.173.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.173.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.173.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.174.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.174.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.174.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.174.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.174.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.174.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.175.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.175.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.175.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.175.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.175.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.175.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.176.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.176.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.176.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.176.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.176.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.176.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.177.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.177.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.177.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.177.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.177.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.177.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.178.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.178.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.178.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.178.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.178.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.178.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.179.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.179.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.179.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.179.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.179.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.179.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.180.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.180.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.180.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.180.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.180.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.180.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.181.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.181.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.181.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.181.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.181.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.181.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.182.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.182.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.182.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.182.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.182.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.182.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.183.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.183.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.183.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.183.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.183.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.183.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.184.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.184.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.184.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.184.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.184.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.184.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.185.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.185.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.185.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.185.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.185.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.185.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.186.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.186.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.186.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.186.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.186.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.186.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.187.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.187.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.187.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.187.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.187.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.187.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.188.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.188.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.188.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.188.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.188.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.188.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.189.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.189.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.189.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.189.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.189.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.189.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.190.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.190.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.190.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.190.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.190.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.190.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.191.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.191.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.191.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.191.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.191.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.191.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.192.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.192.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.192.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.192.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.192.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.192.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.193.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.193.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.193.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.193.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.193.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.193.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.194.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.194.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.194.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.194.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.194.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.194.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.195.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.195.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.195.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.195.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.195.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.195.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.196.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.196.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.196.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.196.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.196.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.196.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.197.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.197.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.197.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.197.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.197.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.197.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.198.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.198.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.198.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.198.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.198.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.198.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.199.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.199.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.199.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.199.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.199.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.199.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.200.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.200.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.200.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.200.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.200.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.200.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.201.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.201.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.201.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.201.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.201.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.201.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.202.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.202.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.202.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.202.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.202.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.202.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.203.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.203.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.203.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.203.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.203.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.203.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.204.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.204.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.204.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.204.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.204.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.204.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.205.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.205.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.205.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.205.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.205.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.205.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.206.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.206.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.206.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.206.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.206.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.206.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.207.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.207.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.207.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.207.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.207.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.207.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.208.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.208.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.208.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.208.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.208.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.208.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.209.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.209.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.209.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.209.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.209.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.209.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.210.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.210.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.210.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.210.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.210.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.210.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.211.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.211.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.211.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.211.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.211.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.211.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.212.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.212.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.212.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.212.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.212.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.212.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.213.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.213.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.213.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.213.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.213.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.213.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.214.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.214.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.214.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.214.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.214.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.214.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.215.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.215.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.215.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.215.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.215.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.215.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.216.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.216.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.216.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.216.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.216.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.216.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.217.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.217.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.217.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.217.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.217.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.217.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.218.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.218.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.218.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.218.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.218.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.218.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.219.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.219.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.219.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.219.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.219.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.219.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.220.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.220.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.220.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.220.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.220.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.220.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.221.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.221.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.221.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.221.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.221.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.221.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.222.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.222.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.222.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.222.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.222.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.222.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.223.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.223.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.223.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.223.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.223.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.223.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.224.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.224.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.224.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.224.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.224.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.224.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.225.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.225.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.225.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.225.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.225.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.225.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.226.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.226.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.226.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.226.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.226.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.226.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.227.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.227.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.227.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.227.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.227.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.227.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.228.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.228.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.228.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.228.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.228.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.228.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.229.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.229.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.229.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.229.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.229.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.229.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.230.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.230.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.230.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.230.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.230.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.230.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.231.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.231.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.231.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.231.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.231.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.231.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.232.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.232.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.232.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.232.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.232.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.232.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.233.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.233.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.233.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.233.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.233.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.233.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.234.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.234.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.234.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.234.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.234.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.234.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.235.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.235.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.235.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.235.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.235.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.235.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.236.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.236.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.236.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.236.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.236.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.236.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.237.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.237.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.237.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.237.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.237.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.237.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.238.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.238.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.238.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.238.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.238.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.238.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.239.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.239.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.239.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.239.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.239.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.239.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.240.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.240.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.240.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.240.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.240.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.240.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.241.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.241.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.241.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.241.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.241.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.241.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.242.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.242.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.242.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.242.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.242.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.242.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.243.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.243.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.243.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.243.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.243.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.243.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.244.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.244.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.244.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.244.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.244.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.244.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.245.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.245.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.245.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.245.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.245.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.245.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.246.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.246.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.246.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.246.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.246.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.246.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.247.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.247.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.247.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.247.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.247.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.247.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.248.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.248.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.248.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.248.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.248.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.248.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.249.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.249.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.249.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.249.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.249.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.249.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.250.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.250.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.250.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.250.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.250.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.250.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.251.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.251.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.251.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.251.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.251.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.251.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.252.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.252.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.252.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.252.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.252.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.252.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.253.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.253.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.253.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.253.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.253.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.253.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.254.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.254.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.254.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.254.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.254.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.254.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.255.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.255.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.255.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.255.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.255.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.255.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.input_layernorm.weight": "model-00111-of-000163.safetensors", "model.layers.42.post_attention_layernorm.weight": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.q_a_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.self_attn.q_a_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.q_a_layernorm.weight": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.q_b_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.self_attn.q_b_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.kv_a_proj_with_mqa.weight": "model-00111-of-000163.safetensors", - "model.layers.43.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.kv_a_layernorm.weight": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.kv_b_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.self_attn.kv_b_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.o_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.self_attn.o_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.gate.weight": "model-00111-of-000163.safetensors", "model.layers.43.mlp.gate.e_score_correction_bias": "model-00111-of-000163.safetensors", "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.shared_experts.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.shared_experts.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.shared_experts.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.0.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.0.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.0.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.0.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.0.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.1.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.1.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.1.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.1.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.1.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.2.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.2.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.2.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.2.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.2.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.3.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.3.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.3.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.3.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.3.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.4.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.4.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.4.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.4.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.4.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.5.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.5.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.5.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.5.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.5.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.6.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.6.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.6.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.6.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.6.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.7.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.7.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.7.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.7.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.7.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.8.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.8.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.8.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.8.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.8.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.9.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.9.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.9.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.9.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.9.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.10.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.10.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.10.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.10.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.10.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.11.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.11.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.11.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.11.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.11.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.12.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.12.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.12.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.12.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.12.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.13.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.13.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.13.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.13.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.13.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.14.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.14.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.14.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.14.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.14.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.15.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.15.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.15.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.15.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.15.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.16.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.16.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.16.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.16.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.16.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.17.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.17.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.17.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.17.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.17.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.18.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.18.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.18.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.18.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.18.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.19.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.19.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.19.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.19.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.19.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.20.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.20.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.20.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.20.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.20.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.21.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.21.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.21.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.21.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.21.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.22.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.22.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.22.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.22.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.22.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.23.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.23.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.23.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.23.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.23.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.24.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.24.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.24.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.24.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.24.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.25.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.25.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.25.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.25.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.25.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.26.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.26.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.26.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.26.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.26.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.27.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.27.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.27.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.27.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.27.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.28.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.28.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.28.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.28.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.28.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.29.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.29.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.29.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.29.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.29.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.30.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.30.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.30.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.30.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.30.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.31.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.31.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.31.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.31.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.31.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.32.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.32.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.32.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.32.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.32.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.33.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.33.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.33.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.33.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.33.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.34.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.34.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.34.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.34.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.34.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.35.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.35.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.35.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.35.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.35.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.36.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.36.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.36.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.36.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.36.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.37.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.37.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.37.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.37.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.37.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.38.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.38.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.38.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.38.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.38.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.39.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.39.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.39.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.39.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.39.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.40.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.40.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.40.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.40.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.40.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.41.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.41.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.41.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.41.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.41.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.42.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.42.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.42.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.42.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.42.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.43.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.43.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.43.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.43.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.43.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.44.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.44.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.44.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.44.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.44.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.45.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.45.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.45.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.45.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.45.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.46.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.46.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.46.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.46.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.46.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.47.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.47.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.47.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.47.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.47.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.48.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.48.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.48.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.48.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.48.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.49.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.49.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.49.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.49.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.49.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.50.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.50.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.50.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.50.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.50.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.51.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.51.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.51.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.51.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.51.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.52.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.52.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.52.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.52.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.52.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.53.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.53.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.53.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.53.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.53.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.54.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.54.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.54.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.54.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.54.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.55.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.55.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.55.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.55.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.55.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.56.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.56.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.56.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.56.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.56.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.57.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.57.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.57.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.57.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.57.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.58.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.58.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.58.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.58.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.58.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.59.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.59.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.59.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.59.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.59.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.60.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.60.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.60.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.60.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.60.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.61.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.61.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.61.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.61.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.61.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.62.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.62.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.62.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.62.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.62.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.63.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.63.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.63.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.63.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.63.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.64.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.64.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.64.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.64.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.64.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.65.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.65.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.65.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.65.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.65.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.66.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.66.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.66.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.66.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.66.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.67.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.67.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.67.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.67.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.67.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.68.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.68.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.68.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.68.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.68.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.69.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.69.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.69.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.69.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.69.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.70.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.70.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.70.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.70.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.70.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.71.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.71.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.71.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.71.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.71.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.72.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.72.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.72.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.72.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.72.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.73.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.73.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.73.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.73.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.73.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.74.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.74.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.74.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.74.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.74.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.75.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.75.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.75.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.75.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.75.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.76.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.76.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.76.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.76.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.76.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.77.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.77.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.77.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.77.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.77.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.78.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.78.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.78.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.78.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.78.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.79.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.79.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.79.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.79.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.79.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.80.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.80.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.80.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.80.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.80.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.81.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.81.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.81.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.81.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.81.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.82.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.82.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.82.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.82.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.82.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.83.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.83.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.83.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.83.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.83.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.84.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.84.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.84.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.84.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.84.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.85.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.85.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.85.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.85.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.85.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.86.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.86.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.86.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.86.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.86.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.87.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.87.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.87.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.87.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.87.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.88.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.88.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.88.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.88.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.88.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.89.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.89.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.89.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.89.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.89.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.90.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.90.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.90.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.90.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.90.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.91.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.91.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.91.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.91.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.91.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.92.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.92.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.92.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.92.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.92.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.93.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.93.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.93.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.93.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.93.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.94.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.94.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.94.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.94.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.94.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.95.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.95.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.95.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.95.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.95.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.96.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.96.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.96.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.96.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.96.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.97.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.97.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.97.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.97.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.97.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.98.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.98.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.98.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.98.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.98.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.99.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.99.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.99.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.99.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.99.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.100.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.100.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.100.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.100.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.100.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.101.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.101.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.101.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.101.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.101.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.102.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.102.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.102.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.102.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.102.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.103.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.103.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.103.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.103.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.103.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.104.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.104.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.104.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.104.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.104.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.105.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.105.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.105.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.105.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.105.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.106.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.106.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.106.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.106.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.106.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.107.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.107.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.107.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.107.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.107.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.108.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.108.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.108.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.108.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.108.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.109.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.109.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.109.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.109.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.109.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.110.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.110.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.110.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.110.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.110.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.111.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.111.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.111.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.111.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.111.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.112.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.112.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.112.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.112.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.112.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.113.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.113.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.113.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.113.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.113.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.114.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.114.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.114.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.114.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.114.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.115.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.115.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.115.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.115.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.115.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.116.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.116.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.116.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.116.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.116.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.117.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.117.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.117.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.117.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.117.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.118.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.118.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.118.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.118.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.118.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.119.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.119.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.119.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.119.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.119.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.120.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.120.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.120.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.120.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.120.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.121.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.121.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.121.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.121.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.121.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.122.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.122.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.122.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.122.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.122.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.123.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.123.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.123.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.123.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.123.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.124.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.124.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.124.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.124.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.124.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.125.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.125.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.125.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.125.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.125.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.126.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.126.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.126.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.126.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.126.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.127.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.127.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.127.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.127.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.127.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.128.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.128.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.128.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.128.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.128.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.128.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.129.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.129.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.129.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.129.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.129.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.129.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.130.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.130.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.130.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.130.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.130.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.130.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.131.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.131.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.131.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.131.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.131.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.131.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.132.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.132.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.132.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.132.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.132.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.132.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.133.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.133.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.133.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.133.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.133.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.133.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.134.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.134.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.134.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.134.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.134.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.134.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.135.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.135.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.135.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.135.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.135.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.135.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.136.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.136.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.136.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.136.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.136.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.136.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.137.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.137.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.137.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.137.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.137.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.137.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.138.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.138.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.138.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.138.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.138.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.138.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.139.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.139.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.139.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.139.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.139.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.139.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.140.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.140.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.140.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.140.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.140.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.140.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.141.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.141.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.141.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.141.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.141.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.141.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.142.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.142.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.142.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.142.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.142.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.142.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.143.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.143.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.143.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.143.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.143.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.143.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.144.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.144.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.144.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.144.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.144.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.144.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.145.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.145.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.145.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.145.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.145.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.145.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.146.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.146.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.146.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.146.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.146.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.146.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.147.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.147.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.147.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.147.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.147.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.147.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.148.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.148.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.148.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.148.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.148.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.148.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.149.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.149.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.149.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.149.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.149.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.149.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.150.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.150.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.150.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.150.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.150.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.150.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.151.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.151.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.151.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.151.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.151.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.151.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.152.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.152.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.152.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.152.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.152.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.152.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.153.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.153.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.153.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.153.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.153.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.153.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.154.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.154.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.154.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.154.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.154.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.154.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.155.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.155.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.155.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.155.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.155.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.155.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.156.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.156.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.156.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.156.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.156.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.156.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.157.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.157.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.157.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.157.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.157.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.157.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.158.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.158.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.158.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.158.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.158.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.158.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.159.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.159.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.159.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.159.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.159.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.159.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.160.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.160.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.160.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.160.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.160.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.160.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.161.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.161.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.161.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.161.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.161.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.161.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.162.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.162.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.162.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.162.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.162.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.162.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.163.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.163.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.163.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.163.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.163.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.163.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.164.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.164.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.164.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.164.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.164.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.164.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.165.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.165.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.165.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.165.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.165.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.165.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.166.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.166.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.166.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.166.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.166.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.166.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.167.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.167.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.167.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.167.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.167.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.167.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.168.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.168.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.168.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.168.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.168.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.168.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.169.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.169.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.169.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.169.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.169.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.169.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.170.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.170.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.170.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.170.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.170.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.170.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.171.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.171.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.171.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.171.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.171.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.171.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.172.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.172.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.172.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.172.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.172.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.172.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.173.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.173.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.173.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.173.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.173.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.173.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.174.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.174.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.174.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.174.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.174.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.174.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.175.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.175.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.175.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.175.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.175.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.175.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.176.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.176.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.176.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.176.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.176.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.176.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.177.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.177.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.177.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.177.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.177.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.177.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.178.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.178.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.178.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.178.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.178.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.178.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.179.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.179.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.179.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.179.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.179.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.179.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.180.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.180.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.180.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.180.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.180.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.180.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.181.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.181.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.181.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.181.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.181.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.181.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.182.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.182.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.182.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.182.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.182.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.182.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.183.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.183.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.183.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.183.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.183.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.183.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.184.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.184.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.184.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.184.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.184.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.184.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.185.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.185.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.185.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.185.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.185.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.185.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.186.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.186.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.186.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.186.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.186.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.186.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.187.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.187.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.187.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.187.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.187.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.187.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.188.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.188.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.188.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.188.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.188.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.188.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.189.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.189.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.189.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.189.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.189.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.189.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.190.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.190.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.190.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.190.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.190.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.190.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.191.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.191.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.191.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.191.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.191.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.191.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.192.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.192.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.192.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.192.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.192.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.192.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.193.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.193.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.193.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.193.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.193.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.193.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.194.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.194.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.194.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.194.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.194.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.194.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.195.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.195.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.195.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.195.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.195.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.195.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.196.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.196.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.196.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.196.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.196.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.196.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.197.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.197.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.197.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.197.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.197.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.197.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.198.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.198.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.198.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.198.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.198.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.198.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.199.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.199.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.199.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.199.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.199.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.199.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.200.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.200.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.200.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.200.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.200.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.200.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.201.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.201.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.201.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.201.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.201.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.201.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.202.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.202.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.202.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.202.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.202.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.202.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.203.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.203.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.203.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.203.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.203.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.203.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.204.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.204.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.204.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.204.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.204.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.204.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.205.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.205.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.205.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.205.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.205.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.205.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.206.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.206.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.206.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.206.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.206.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.206.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.207.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.207.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.207.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.207.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.207.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.207.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.208.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.208.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.208.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.208.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.208.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.208.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.209.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.209.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.209.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.209.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.209.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.209.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.210.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.210.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.210.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.210.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.210.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.210.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.211.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.211.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.211.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.211.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.211.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.211.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.212.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.212.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.212.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.212.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.212.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.212.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.213.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.213.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.213.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.213.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.213.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.213.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.214.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.214.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.214.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.214.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.214.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.214.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.215.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.215.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.215.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.215.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.215.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.215.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.216.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.216.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.216.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.216.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.216.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.216.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.217.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.217.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.217.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.217.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.217.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.217.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.218.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.218.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.218.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.218.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.218.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.218.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.219.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.219.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.219.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.219.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.219.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.219.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.220.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.220.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.220.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.220.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.220.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.220.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.221.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.221.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.221.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.221.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.221.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.221.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.222.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.222.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.222.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.222.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.222.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.222.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.223.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.223.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.223.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.223.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.223.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.223.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.224.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.224.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.224.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.224.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.224.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.224.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.225.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.225.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.225.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.225.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.225.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.225.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.226.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.226.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.226.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.226.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.226.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.226.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.227.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.227.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.227.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.227.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.227.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.227.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.228.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.228.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.228.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.228.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.228.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.228.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.229.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.229.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.229.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.229.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.229.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.229.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.230.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.230.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.230.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.230.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.230.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.230.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.231.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.231.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.231.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.231.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.231.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.231.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.232.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.232.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.232.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.232.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.232.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.232.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.233.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.233.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.233.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.233.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.233.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.233.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.234.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.234.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.234.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.234.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.234.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.234.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.235.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.235.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.235.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.235.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.235.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.235.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.236.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.236.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.236.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.236.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.236.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.236.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.237.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.237.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.237.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.237.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.237.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.237.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.238.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.238.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.238.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.238.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.238.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.238.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.239.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.239.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.239.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.239.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.239.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.239.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.240.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.240.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.240.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.240.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.240.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.240.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.241.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.241.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.241.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.241.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.241.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.241.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.242.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.242.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.242.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.242.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.242.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.242.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.243.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.243.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.243.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.243.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.243.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.243.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.244.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.244.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.244.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.244.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.244.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.244.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.245.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.245.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.245.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.245.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.245.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.245.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.246.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.246.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.246.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.246.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.246.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.246.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.247.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.247.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.247.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.247.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.247.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.247.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.248.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.248.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.248.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.248.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.248.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.248.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.249.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.249.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.249.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.249.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.249.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.249.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.250.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.250.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.250.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.250.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.250.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.250.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.251.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.251.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.251.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.251.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.251.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.251.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.252.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.252.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.252.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.252.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.252.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.252.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.253.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.253.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.253.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.253.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.253.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.253.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.254.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.254.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.254.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.254.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.254.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.254.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.255.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.255.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.255.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.255.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.255.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.255.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.input_layernorm.weight": "model-00114-of-000163.safetensors", "model.layers.43.post_attention_layernorm.weight": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.q_a_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.self_attn.q_a_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.q_a_layernorm.weight": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.q_b_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.self_attn.q_b_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.kv_a_proj_with_mqa.weight": "model-00114-of-000163.safetensors", - "model.layers.44.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.kv_a_layernorm.weight": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.kv_b_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.self_attn.kv_b_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.o_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.self_attn.o_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.gate.weight": "model-00114-of-000163.safetensors", "model.layers.44.mlp.gate.e_score_correction_bias": "model-00114-of-000163.safetensors", "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.shared_experts.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.shared_experts.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.0.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.0.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.0.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.0.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.0.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.1.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.1.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.1.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.1.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.1.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.2.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.2.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.2.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.2.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.2.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.3.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.3.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.3.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.3.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.3.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.4.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.4.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.4.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.4.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.4.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.5.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.5.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.5.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.5.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.5.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.6.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.6.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.6.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.6.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.6.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.7.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.7.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.7.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.7.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.7.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.8.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.8.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.8.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.8.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.8.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.9.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.9.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.9.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.9.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.9.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.10.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.10.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.10.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.10.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.10.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.11.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.11.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.11.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.11.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.11.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.12.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.12.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.12.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.12.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.12.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.13.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.13.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.13.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.13.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.13.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.13.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.14.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.14.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.14.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.14.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.14.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.15.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.15.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.15.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.15.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.15.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.15.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.16.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.16.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.16.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.16.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.16.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.17.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.17.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.17.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.17.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.17.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.18.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.18.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.18.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.18.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.18.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.19.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.19.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.19.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.19.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.19.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.20.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.20.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.20.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.20.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.20.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.21.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.21.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.21.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.21.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.21.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.22.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.22.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.22.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.22.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.22.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.23.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.23.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.23.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.23.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.23.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.24.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.24.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.24.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.24.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.24.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.25.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.25.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.25.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.25.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.25.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.26.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.26.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.26.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.26.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.26.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.26.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.27.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.27.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.27.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.27.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.27.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.28.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.28.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.28.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.28.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.28.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.29.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.29.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.29.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.29.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.29.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.30.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.30.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.30.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.30.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.30.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.31.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.31.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.31.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.31.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.31.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.32.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.32.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.32.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.32.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.32.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.33.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.33.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.33.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.33.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.33.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.34.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.34.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.34.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.34.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.34.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.35.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.35.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.35.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.35.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.35.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.36.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.36.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.36.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.36.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.36.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.37.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.37.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.37.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.37.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.37.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.38.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.38.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.38.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.38.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.38.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.39.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.39.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.39.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.39.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.39.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.40.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.40.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.40.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.40.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.40.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.41.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.41.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.41.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.41.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.41.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.42.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.42.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.42.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.42.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.42.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.43.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.43.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.43.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.43.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.43.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.44.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.44.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.44.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.44.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.44.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.45.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.45.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.45.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.45.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.45.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.46.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.46.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.46.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.46.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.46.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.47.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.47.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.47.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.47.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.47.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.47.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.48.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.48.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.48.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.48.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.48.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.49.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.49.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.49.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.49.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.49.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.50.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.50.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.50.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.50.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.50.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.51.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.51.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.51.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.51.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.51.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.52.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.52.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.52.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.52.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.52.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.53.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.53.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.53.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.53.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.53.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.54.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.54.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.54.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.54.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.54.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.55.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.55.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.55.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.55.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.55.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.56.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.56.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.56.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.56.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.56.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.57.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.57.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.57.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.57.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.57.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.58.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.58.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.58.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.58.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.58.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.59.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.59.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.59.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.59.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.59.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.60.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.60.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.60.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.60.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.60.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.61.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.61.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.61.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.61.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.61.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.62.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.62.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.62.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.62.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.62.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.63.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.63.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.63.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.63.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.63.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.64.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.64.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.64.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.64.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.64.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.65.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.65.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.65.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.65.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.65.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.66.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.66.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.66.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.66.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.66.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.67.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.67.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.67.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.67.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.67.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.68.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.68.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.68.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.68.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.68.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.69.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.69.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.69.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.69.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.69.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.70.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.70.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.70.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.70.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.70.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.71.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.71.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.71.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.71.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.71.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.72.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.72.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.72.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.72.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.72.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.73.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.73.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.73.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.73.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.73.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.74.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.74.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.74.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.74.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.74.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.75.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.75.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.75.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.75.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.75.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.76.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.76.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.76.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.76.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.76.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.77.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.77.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.77.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.77.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.77.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.78.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.78.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.78.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.78.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.78.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.79.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.79.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.79.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.79.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.79.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.80.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.80.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.80.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.80.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.80.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.81.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.81.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.81.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.81.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.81.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.82.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.82.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.82.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.82.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.82.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.83.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.83.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.83.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.83.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.83.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.84.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.84.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.84.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.84.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.84.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.85.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.85.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.85.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.85.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.85.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.86.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.86.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.86.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.86.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.86.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.87.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.87.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.87.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.87.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.87.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.88.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.88.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.88.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.88.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.88.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.89.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.89.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.89.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.89.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.89.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.90.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.90.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.90.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.90.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.90.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.91.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.91.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.91.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.91.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.91.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.92.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.92.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.92.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.92.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.92.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.92.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.93.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.93.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.93.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.93.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.93.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.94.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.94.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.94.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.94.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.94.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.95.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.95.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.95.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.95.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.95.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.96.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.96.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.96.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.96.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.96.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.97.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.97.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.97.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.97.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.97.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.98.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.98.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.98.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.98.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.98.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.99.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.99.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.99.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.99.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.99.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.100.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.100.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.100.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.100.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.100.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.101.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.101.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.101.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.101.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.101.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.102.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.102.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.102.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.102.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.102.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.103.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.103.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.103.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.103.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.103.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.104.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.104.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.104.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.104.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.104.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.105.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.105.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.105.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.105.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.105.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.106.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.106.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.106.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.106.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.106.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.107.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.107.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.107.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.107.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.107.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.108.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.108.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.108.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.108.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.108.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.109.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.109.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.109.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.109.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.109.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.110.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.110.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.110.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.110.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.110.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.111.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.111.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.111.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.111.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.111.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.112.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.112.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.112.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.112.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.112.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.113.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.113.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.113.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.113.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.113.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.114.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.114.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.114.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.114.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.114.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.115.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.115.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.115.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.115.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.115.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.116.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.116.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.116.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.116.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.116.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.117.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.117.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.117.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.117.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.117.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.118.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.118.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.118.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.118.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.118.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.119.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.119.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.119.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.119.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.119.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.120.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.120.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.120.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.120.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.120.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.120.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.121.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.121.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.121.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.121.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.121.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.122.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.122.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.122.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.122.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.122.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.123.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.123.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.123.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.123.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.123.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.124.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.124.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.124.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.124.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.124.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.125.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.125.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.125.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.125.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.125.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.126.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.126.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.126.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.126.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.126.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.127.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.127.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.127.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.127.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.127.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.127.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.128.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.128.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.128.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.128.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.128.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.128.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.129.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.129.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.129.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.129.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.129.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.129.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.130.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.130.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.130.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.130.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.130.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.130.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.131.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.131.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.131.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.131.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.131.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.131.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.132.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.132.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.132.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.132.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.132.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.132.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.133.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.133.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.133.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.133.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.133.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.133.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.134.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.134.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.134.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.134.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.134.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.134.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.135.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.135.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.135.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.135.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.135.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.135.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.136.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.136.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.136.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.136.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.136.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.136.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.137.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.137.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.137.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.137.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.137.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.137.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.138.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.138.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.138.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.138.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.138.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.138.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.139.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.139.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.139.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.139.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.139.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.139.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.140.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.140.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.140.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.140.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.140.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.140.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.141.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.141.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.141.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.141.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.141.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.141.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.142.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.142.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.142.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.142.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.142.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.142.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.143.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.143.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.143.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.143.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.143.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.143.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.144.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.144.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.144.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.144.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.144.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.144.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.145.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.145.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.145.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.145.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.145.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.145.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.146.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.146.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.146.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.146.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.146.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.146.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.147.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.147.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.147.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.147.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.147.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.147.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.148.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.148.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.148.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.148.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.148.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.148.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.149.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.149.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.149.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.149.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.149.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.149.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.150.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.150.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.150.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.150.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.150.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.150.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.151.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.151.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.151.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.151.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.151.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.151.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.152.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.152.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.152.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.152.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.152.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.152.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.153.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.153.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.153.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.153.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.153.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.153.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.154.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.154.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.154.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.154.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.154.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.154.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.155.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.155.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.155.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.155.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.155.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.155.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.156.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.156.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.156.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.156.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.156.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.156.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.157.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.157.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.157.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.157.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.157.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.157.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.158.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.158.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.158.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.158.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.158.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.158.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.159.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.159.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.159.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.159.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.159.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.159.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.160.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.160.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.160.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.160.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.160.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.160.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.161.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.161.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.161.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.161.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.161.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.161.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.162.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.162.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.162.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.162.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.162.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.162.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.163.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.163.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.163.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.163.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.163.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.163.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.164.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.164.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.164.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.164.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.164.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.164.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.165.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.165.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.165.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.165.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.165.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.165.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.166.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.166.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.166.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.166.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.166.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.166.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.167.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.167.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.167.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.167.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.167.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.167.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.168.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.168.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.168.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.168.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.168.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.168.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.169.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.169.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.169.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.169.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.169.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.169.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.170.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.170.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.170.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.170.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.170.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.170.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.171.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.171.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.171.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.171.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.171.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.171.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.172.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.172.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.172.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.172.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.172.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.172.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.173.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.173.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.173.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.173.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.173.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.173.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.174.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.174.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.174.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.174.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.174.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.174.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.175.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.175.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.175.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.175.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.175.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.175.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.176.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.176.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.176.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.176.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.176.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.176.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.177.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.177.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.177.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.177.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.177.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.177.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.178.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.178.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.178.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.178.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.178.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.178.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.179.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.179.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.179.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.179.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.179.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.179.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.180.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.180.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.180.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.180.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.180.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.180.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.181.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.181.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.181.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.181.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.181.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.181.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.182.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.182.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.182.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.182.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.182.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.182.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.183.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.183.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.183.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.183.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.183.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.183.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.184.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.184.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.184.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.184.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.184.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.184.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.185.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.185.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.185.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.185.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.185.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.185.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.186.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.186.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.186.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.186.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.186.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.186.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.187.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.187.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.187.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.187.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.187.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.187.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.188.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.188.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.188.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.188.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.188.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.188.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.189.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.189.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.189.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.189.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.189.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.189.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.190.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.190.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.190.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.190.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.190.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.190.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.191.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.191.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.191.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.191.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.191.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.191.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.192.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.192.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.192.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.192.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.192.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.192.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.193.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.193.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.193.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.193.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.193.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.193.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.194.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.194.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.194.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.194.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.194.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.194.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.195.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.195.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.195.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.195.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.195.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.195.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.196.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.196.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.196.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.196.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.196.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.196.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.197.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.197.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.197.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.197.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.197.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.197.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.198.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.198.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.198.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.198.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.198.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.198.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.199.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.199.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.199.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.199.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.199.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.199.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.200.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.200.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.200.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.200.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.200.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.200.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.201.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.201.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.201.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.201.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.201.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.201.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.202.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.202.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.202.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.202.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.202.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.202.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.203.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.203.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.203.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.203.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.203.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.203.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.204.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.204.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.204.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.204.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.204.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.204.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.205.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.205.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.205.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.205.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.205.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.205.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.206.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.206.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.206.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.206.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.206.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.206.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.207.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.207.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.207.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.207.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.207.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.207.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.208.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.208.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.208.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.208.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.208.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.208.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.209.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.209.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.209.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.209.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.209.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.209.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.210.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.210.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.210.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.210.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.210.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.210.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.211.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.211.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.211.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.211.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.211.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.211.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.212.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.212.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.212.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.212.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.212.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.212.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.213.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.213.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.213.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.213.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.213.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.213.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.214.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.214.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.214.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.214.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.214.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.214.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.215.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.215.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.215.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.215.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.215.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.215.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.216.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.216.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.216.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.216.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.216.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.216.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.217.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.217.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.217.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.217.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.217.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.217.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.218.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.218.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.218.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.218.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.218.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.218.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.219.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.219.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.219.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.219.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.219.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.219.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.220.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.220.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.220.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.220.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.220.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.220.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.221.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.221.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.221.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.221.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.221.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.221.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.222.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.222.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.222.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.222.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.222.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.222.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.223.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.223.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.223.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.223.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.223.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.223.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.224.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.224.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.224.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.224.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.224.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.224.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.225.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.225.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.225.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.225.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.225.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.225.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.226.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.226.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.226.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.226.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.226.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.226.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.227.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.227.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.227.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.227.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.227.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.227.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.228.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.228.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.228.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.228.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.228.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.228.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.229.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.229.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.229.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.229.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.229.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.229.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.230.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.230.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.230.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.230.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.230.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.230.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.231.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.231.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.231.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.231.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.231.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.231.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.232.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.232.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.232.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.232.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.232.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.232.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.233.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.233.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.233.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.233.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.233.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.233.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.234.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.234.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.234.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.234.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.234.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.234.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.235.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.235.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.235.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.235.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.235.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.235.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.236.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.236.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.236.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.236.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.236.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.236.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.237.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.237.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.237.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.237.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.237.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.237.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.238.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.238.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.238.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.238.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.238.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.238.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.239.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.239.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.239.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.239.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.239.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.239.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.240.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.240.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.240.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.240.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.240.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.240.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.241.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.241.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.241.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.241.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.241.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.241.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.242.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.242.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.242.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.242.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.242.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.242.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.243.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.243.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.243.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.243.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.243.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.243.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.244.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.244.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.244.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.244.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.244.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.244.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.245.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.245.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.245.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.245.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.245.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.245.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.246.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.246.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.246.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.246.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.246.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.246.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.247.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.247.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.247.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.247.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.247.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.247.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.248.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.248.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.248.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.248.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.248.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.248.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.249.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.249.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.249.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.249.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.249.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.249.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.250.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.250.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.250.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.250.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.250.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.250.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.251.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.251.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.251.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.251.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.251.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.251.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.252.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.252.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.252.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.252.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.252.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.252.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.253.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.253.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.253.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.253.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.253.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.253.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.254.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.254.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.254.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.254.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.254.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.254.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.255.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.255.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.255.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.255.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.255.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.255.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.input_layernorm.weight": "model-00117-of-000163.safetensors", "model.layers.44.post_attention_layernorm.weight": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.q_a_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.self_attn.q_a_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.q_a_layernorm.weight": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.q_b_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.self_attn.q_b_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.kv_a_proj_with_mqa.weight": "model-00117-of-000163.safetensors", - "model.layers.45.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.kv_a_layernorm.weight": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.kv_b_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.self_attn.kv_b_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.o_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.self_attn.o_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.gate.weight": "model-00117-of-000163.safetensors", "model.layers.45.mlp.gate.e_score_correction_bias": "model-00117-of-000163.safetensors", "model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.shared_experts.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.shared_experts.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.0.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.0.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.0.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.0.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.0.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.1.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.1.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.1.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.1.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.1.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.2.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.2.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.2.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.2.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.2.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.3.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.3.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.3.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.3.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.3.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.4.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.4.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.4.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.4.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.4.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.5.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.5.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.5.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.5.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.5.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.6.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.6.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.6.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.6.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.6.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.7.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.7.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.7.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.7.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.7.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.8.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.8.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.8.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.8.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.8.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.9.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.9.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.9.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.9.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.9.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.10.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.10.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.10.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.10.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.10.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.11.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.11.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.11.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.11.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.11.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.12.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.12.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.12.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.12.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.12.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.13.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.13.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.13.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.13.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.13.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.14.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.14.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.14.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.14.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.14.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.15.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.15.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.15.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.15.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.15.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.16.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.16.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.16.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.16.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.16.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.17.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.17.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.17.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.17.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.17.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.18.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.18.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.18.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.18.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.18.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.19.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.19.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.19.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.19.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.19.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.20.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.20.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.20.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.20.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.20.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.21.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.21.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.21.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.21.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.21.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.22.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.22.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.22.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.22.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.22.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.23.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.23.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.23.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.23.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.23.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.23.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.24.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.24.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.24.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.24.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.24.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.25.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.25.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.25.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.25.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.25.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.26.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.26.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.26.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.26.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.26.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.27.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.27.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.27.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.27.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.27.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.28.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.28.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.28.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.28.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.28.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.29.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.29.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.29.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.29.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.29.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.30.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.30.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.30.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.30.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.30.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.30.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.31.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.31.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.31.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.31.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.31.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.32.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.32.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.32.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.32.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.32.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.33.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.33.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.33.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.33.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.33.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.34.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.34.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.34.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.34.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.34.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.35.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.35.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.35.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.35.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.35.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.36.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.36.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.36.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.36.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.36.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.37.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.37.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.37.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.37.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.37.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.38.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.38.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.38.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.38.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.38.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.39.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.39.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.39.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.39.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.39.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.40.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.40.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.40.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.40.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.40.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.41.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.41.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.41.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.41.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.41.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.42.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.42.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.42.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.42.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.42.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.43.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.43.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.43.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.43.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.43.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.44.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.44.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.44.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.44.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.44.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.45.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.45.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.45.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.45.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.45.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.46.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.46.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.46.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.46.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.46.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.47.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.47.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.47.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.47.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.47.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.48.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.48.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.48.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.48.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.48.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.49.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.49.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.49.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.49.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.49.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.50.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.50.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.50.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.50.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.50.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.51.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.51.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.51.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.51.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.51.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.52.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.52.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.52.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.52.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.52.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.53.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.53.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.53.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.53.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.53.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.54.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.54.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.54.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.54.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.54.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.55.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.55.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.55.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.55.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.55.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.56.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.56.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.56.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.56.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.56.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.57.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.57.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.57.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.57.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.57.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.58.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.58.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.58.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.58.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.58.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.59.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.59.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.59.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.59.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.59.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.60.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.60.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.60.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.60.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.60.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.61.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.61.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.61.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.61.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.61.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.62.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.62.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.62.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.62.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.62.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.63.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.63.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.63.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.63.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.63.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.64.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.64.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.64.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.64.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.64.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.65.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.65.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.65.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.65.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.65.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.66.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.66.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.66.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.66.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.66.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.67.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.67.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.67.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.67.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.67.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.68.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.68.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.68.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.68.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.68.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.69.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.69.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.69.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.69.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.69.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.70.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.70.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.70.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.70.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.70.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.71.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.71.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.71.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.71.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.71.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.72.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.72.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.72.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.72.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.72.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.73.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.73.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.73.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.73.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.73.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.74.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.74.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.74.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.74.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.74.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.75.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.75.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.75.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.75.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.75.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.76.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.76.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.76.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.76.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.76.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.77.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.77.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.77.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.77.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.77.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.78.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.78.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.78.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.78.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.78.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.79.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.79.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.79.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.79.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.79.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.79.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.80.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.80.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.80.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.80.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.80.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.81.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.81.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.81.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.81.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.81.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.82.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.82.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.82.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.82.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.82.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.83.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.83.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.83.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.83.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.83.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.84.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.84.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.84.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.84.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.84.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.85.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.85.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.85.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.85.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.85.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.86.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.86.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.86.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.86.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.86.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.86.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.87.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.87.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.87.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.87.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.87.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.88.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.88.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.88.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.88.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.88.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.89.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.89.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.89.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.89.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.89.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.90.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.90.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.90.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.90.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.90.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.91.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.91.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.91.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.91.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.91.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.92.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.92.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.92.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.92.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.92.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.93.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.93.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.93.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.93.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.93.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.93.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.94.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.94.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.94.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.94.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.94.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.95.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.95.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.95.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.95.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.95.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.96.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.96.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.96.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.96.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.96.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.97.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.97.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.97.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.97.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.97.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.98.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.98.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.98.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.98.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.98.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.99.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.99.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.99.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.99.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.99.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.100.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.100.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.100.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.100.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.100.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.101.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.101.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.101.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.101.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.101.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.102.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.102.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.102.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.102.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.102.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.103.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.103.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.103.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.103.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.103.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.104.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.104.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.104.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.104.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.104.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.105.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.105.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.105.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.105.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.105.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.106.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.106.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.106.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.106.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.106.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.107.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.107.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.107.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.107.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.107.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.108.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.108.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.108.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.108.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.108.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.109.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.109.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.109.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.109.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.109.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.110.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.110.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.110.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.110.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.110.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.111.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.111.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.111.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.111.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.111.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.112.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.112.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.112.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.112.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.112.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.113.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.113.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.113.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.113.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.113.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.114.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.114.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.114.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.114.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.114.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.115.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.115.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.115.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.115.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.115.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.116.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.116.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.116.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.116.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.116.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.117.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.117.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.117.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.117.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.117.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.118.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.118.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.118.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.118.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.118.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.119.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.119.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.119.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.119.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.119.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.120.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.120.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.120.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.120.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.120.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.121.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.121.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.121.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.121.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.121.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.122.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.122.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.122.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.122.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.122.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.123.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.123.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.123.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.123.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.123.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.124.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.124.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.124.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.124.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.124.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.125.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.125.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.125.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.125.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.125.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.126.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.126.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.126.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.126.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.126.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.127.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.127.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.127.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.127.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.127.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.128.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.128.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.128.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.128.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.128.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.128.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.129.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.129.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.129.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.129.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.129.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.129.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.130.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.130.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.130.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.130.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.130.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.130.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.131.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.131.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.131.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.131.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.131.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.131.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.132.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.132.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.132.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.132.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.132.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.132.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.133.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.133.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.133.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.133.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.133.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.133.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.134.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.134.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.134.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.134.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.134.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.134.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.135.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.135.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.135.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.135.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.135.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.135.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.136.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.136.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.136.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.136.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.136.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.136.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.137.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.137.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.137.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.137.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.137.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.137.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.138.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.138.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.138.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.138.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.138.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.138.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.139.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.139.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.139.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.139.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.139.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.139.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.140.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.140.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.140.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.140.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.140.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.140.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.141.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.141.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.141.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.141.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.141.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.141.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.142.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.142.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.142.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.142.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.142.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.142.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.143.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.143.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.143.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.143.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.143.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.143.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.144.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.144.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.144.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.144.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.144.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.144.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.145.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.145.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.145.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.145.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.145.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.145.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.146.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.146.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.146.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.146.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.146.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.146.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.147.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.147.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.147.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.147.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.147.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.147.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.148.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.148.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.148.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.148.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.148.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.148.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.149.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.149.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.149.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.149.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.149.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.149.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.150.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.150.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.150.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.150.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.150.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.150.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.151.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.151.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.151.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.151.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.151.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.151.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.152.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.152.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.152.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.152.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.152.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.152.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.153.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.153.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.153.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.153.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.153.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.153.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.154.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.154.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.154.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.154.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.154.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.154.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.155.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.155.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.155.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.155.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.155.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.155.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.156.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.156.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.156.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.156.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.156.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.156.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.157.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.157.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.157.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.157.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.157.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.157.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.158.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.158.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.158.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.158.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.158.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.158.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.159.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.159.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.159.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.159.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.159.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.159.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.160.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.160.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.160.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.160.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.160.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.160.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.161.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.161.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.161.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.161.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.161.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.161.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.162.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.162.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.162.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.162.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.162.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.162.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.163.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.163.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.163.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.163.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.163.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.163.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.164.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.164.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.164.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.164.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.164.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.164.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.165.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.165.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.165.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.165.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.165.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.165.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.166.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.166.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.166.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.166.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.166.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.166.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.167.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.167.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.167.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.167.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.167.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.167.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.168.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.168.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.168.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.168.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.168.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.168.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.169.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.169.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.169.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.169.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.169.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.169.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.170.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.170.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.170.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.170.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.170.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.170.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.171.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.171.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.171.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.171.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.171.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.171.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.172.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.172.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.172.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.172.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.172.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.172.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.173.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.173.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.173.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.173.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.173.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.173.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.174.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.174.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.174.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.174.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.174.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.174.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.175.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.175.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.175.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.175.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.175.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.175.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.176.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.176.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.176.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.176.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.176.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.176.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.177.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.177.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.177.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.177.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.177.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.177.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.178.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.178.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.178.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.178.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.178.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.178.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.179.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.179.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.179.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.179.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.179.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.179.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.180.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.180.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.180.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.180.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.180.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.180.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.181.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.181.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.181.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.181.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.181.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.181.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.182.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.182.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.182.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.182.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.182.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.182.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.183.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.183.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.183.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.183.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.183.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.183.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.184.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.184.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.184.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.184.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.184.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.184.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.185.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.185.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.185.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.185.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.185.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.185.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.186.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.186.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.186.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.186.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.186.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.186.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.187.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.187.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.187.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.187.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.187.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.187.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.188.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.188.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.188.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.188.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.188.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.188.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.189.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.189.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.189.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.189.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.189.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.189.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.190.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.190.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.190.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.190.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.190.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.190.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.191.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.191.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.191.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.191.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.191.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.191.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.192.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.192.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.192.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.192.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.192.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.192.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.193.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.193.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.193.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.193.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.193.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.193.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.194.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.194.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.194.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.194.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.194.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.194.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.195.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.195.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.195.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.195.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.195.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.195.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.196.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.196.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.196.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.196.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.196.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.196.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.197.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.197.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.197.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.197.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.197.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.197.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.198.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.198.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.198.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.198.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.198.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.198.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.199.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.199.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.199.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.199.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.199.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.199.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.200.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.200.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.200.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.200.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.200.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.200.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.201.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.201.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.201.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.201.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.201.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.201.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.202.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.202.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.202.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.202.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.202.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.202.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.203.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.203.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.203.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.203.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.203.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.203.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.204.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.204.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.204.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.204.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.204.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.204.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.205.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.205.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.205.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.205.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.205.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.205.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.206.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.206.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.206.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.206.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.206.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.206.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.207.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.207.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.207.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.207.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.207.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.207.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.208.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.208.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.208.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.208.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.208.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.208.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.209.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.209.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.209.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.209.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.209.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.209.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.210.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.210.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.210.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.210.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.210.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.210.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.211.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.211.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.211.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.211.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.211.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.211.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.212.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.212.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.212.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.212.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.212.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.212.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.213.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.213.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.213.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.213.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.213.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.213.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.214.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.214.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.214.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.214.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.214.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.214.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.215.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.215.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.215.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.215.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.215.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.215.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.216.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.216.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.216.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.216.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.216.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.216.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.217.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.217.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.217.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.217.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.217.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.217.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.218.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.218.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.218.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.218.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.218.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.218.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.219.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.219.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.219.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.219.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.219.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.219.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.220.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.220.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.220.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.220.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.220.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.220.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.221.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.221.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.221.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.221.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.221.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.221.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.222.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.222.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.222.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.222.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.222.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.222.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.223.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.223.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.223.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.223.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.223.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.223.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.224.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.224.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.224.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.224.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.224.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.224.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.225.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.225.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.225.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.225.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.225.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.225.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.226.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.226.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.226.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.226.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.226.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.226.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.227.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.227.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.227.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.227.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.227.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.227.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.228.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.228.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.228.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.228.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.228.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.228.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.229.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.229.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.229.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.229.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.229.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.229.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.230.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.230.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.230.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.230.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.230.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.230.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.231.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.231.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.231.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.231.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.231.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.231.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.232.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.232.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.232.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.232.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.232.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.232.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.233.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.233.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.233.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.233.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.233.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.233.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.234.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.234.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.234.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.234.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.234.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.234.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.235.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.235.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.235.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.235.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.235.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.235.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.236.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.236.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.236.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.236.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.236.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.236.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.237.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.237.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.237.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.237.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.237.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.237.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.238.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.238.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.238.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.238.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.238.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.238.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.239.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.239.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.239.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.239.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.239.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.239.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.240.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.240.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.240.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.240.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.240.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.240.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.241.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.241.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.241.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.241.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.241.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.241.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.242.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.242.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.242.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.242.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.242.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.242.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.243.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.243.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.243.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.243.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.243.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.243.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.244.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.244.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.244.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.244.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.244.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.244.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.245.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.245.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.245.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.245.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.245.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.245.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.246.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.246.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.246.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.246.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.246.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.246.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.247.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.247.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.247.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.247.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.247.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.247.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.248.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.248.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.248.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.248.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.248.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.248.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.249.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.249.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.249.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.249.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.249.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.249.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.250.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.250.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.250.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.250.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.250.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.250.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.251.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.251.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.251.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.251.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.251.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.251.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.252.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.252.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.252.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.252.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.252.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.252.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.253.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.253.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.253.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.253.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.253.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.253.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.254.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.254.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.254.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.254.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.254.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.254.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.255.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.255.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.255.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.255.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.255.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.255.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.input_layernorm.weight": "model-00119-of-000163.safetensors", "model.layers.45.post_attention_layernorm.weight": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.q_a_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.self_attn.q_a_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.q_a_layernorm.weight": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.q_b_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.self_attn.q_b_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.kv_a_proj_with_mqa.weight": "model-00119-of-000163.safetensors", - "model.layers.46.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.kv_a_layernorm.weight": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.kv_b_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.self_attn.kv_b_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.o_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.self_attn.o_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.gate.weight": "model-00119-of-000163.safetensors", "model.layers.46.mlp.gate.e_score_correction_bias": "model-00119-of-000163.safetensors", "model.layers.46.mlp.shared_experts.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.shared_experts.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.shared_experts.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.0.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.0.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.0.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.0.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.0.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.1.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.1.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.1.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.1.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.1.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.2.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.2.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.2.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.2.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.2.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.3.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.3.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.3.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.3.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.3.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.4.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.4.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.4.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.4.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.4.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.5.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.5.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.5.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.5.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.5.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.6.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.6.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.6.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.6.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.6.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.7.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.7.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.7.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.7.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.7.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.8.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.8.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.8.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.8.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.8.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.9.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.9.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.9.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.9.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.9.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.10.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.10.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.10.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.10.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.10.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.11.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.11.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.11.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.11.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.11.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.12.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.12.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.12.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.12.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.12.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.13.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.13.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.13.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.13.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.13.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.14.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.14.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.14.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.14.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.14.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.15.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.15.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.15.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.15.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.15.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.16.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.16.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.16.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.16.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.16.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.17.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.17.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.17.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.17.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.17.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.18.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.18.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.18.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.18.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.18.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.19.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.19.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.19.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.19.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.19.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.20.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.20.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.20.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.20.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.20.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.21.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.21.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.21.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.21.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.21.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.22.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.22.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.22.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.22.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.22.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.23.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.23.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.23.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.23.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.23.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.24.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.24.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.24.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.24.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.24.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.25.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.25.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.25.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.25.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.25.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.26.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.26.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.26.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.26.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.26.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.27.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.27.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.27.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.27.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.27.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.28.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.28.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.28.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.28.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.28.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.29.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.29.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.29.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.29.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.29.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.30.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.30.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.30.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.30.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.30.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.31.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.31.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.31.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.31.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.31.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.32.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.32.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.32.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.32.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.32.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.33.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.33.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.33.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.33.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.33.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.34.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.34.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.34.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.34.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.34.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.35.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.35.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.35.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.35.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.35.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.36.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.36.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.36.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.36.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.36.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.37.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.37.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.37.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.37.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.37.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.38.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.38.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.38.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.38.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.38.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.39.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.39.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.39.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.39.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.39.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.40.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.40.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.40.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.40.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.40.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.41.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.41.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.41.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.41.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.41.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.42.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.42.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.42.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.42.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.42.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.43.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.43.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.43.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.43.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.43.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.44.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.44.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.44.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.44.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.44.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.45.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.45.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.45.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.45.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.45.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.45.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.46.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.46.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.46.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.46.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.46.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.47.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.47.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.47.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.47.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.47.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.48.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.48.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.48.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.48.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.48.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.49.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.49.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.49.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.49.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.49.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.50.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.50.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.50.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.50.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.50.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.51.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.51.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.51.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.51.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.51.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.52.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.52.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.52.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.52.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.52.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.53.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.53.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.53.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.53.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.53.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.54.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.54.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.54.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.54.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.54.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.55.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.55.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.55.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.55.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.55.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.56.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.56.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.56.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.56.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.56.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.57.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.57.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.57.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.57.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.57.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.58.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.58.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.58.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.58.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.58.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.59.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.59.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.59.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.59.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.59.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.60.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.60.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.60.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.60.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.60.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.61.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.61.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.61.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.61.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.61.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.62.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.62.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.62.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.62.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.62.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.63.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.63.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.63.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.63.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.63.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.64.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.64.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.64.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.64.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.64.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.65.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.65.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.65.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.65.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.65.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.66.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.66.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.66.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.66.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.66.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.67.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.67.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.67.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.67.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.67.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.68.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.68.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.68.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.68.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.68.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.69.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.69.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.69.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.69.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.69.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.70.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.70.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.70.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.70.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.70.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.71.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.71.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.71.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.71.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.71.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.72.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.72.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.72.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.72.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.72.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.73.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.73.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.73.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.73.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.73.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.74.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.74.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.74.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.74.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.74.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.75.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.75.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.75.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.75.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.75.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.76.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.76.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.76.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.76.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.76.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.77.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.77.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.77.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.77.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.77.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.78.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.78.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.78.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.78.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.78.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.79.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.79.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.79.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.79.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.79.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.79.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.80.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.80.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.80.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.80.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.80.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.81.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.81.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.81.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.81.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.81.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.82.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.82.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.82.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.82.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.82.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.83.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.83.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.83.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.83.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.83.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.84.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.84.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.84.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.84.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.84.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.85.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.85.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.85.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.85.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.85.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.86.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.86.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.86.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.86.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.86.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.87.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.87.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.87.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.87.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.87.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.88.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.88.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.88.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.88.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.88.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.89.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.89.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.89.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.89.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.89.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.90.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.90.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.90.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.90.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.90.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.91.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.91.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.91.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.91.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.91.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.92.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.92.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.92.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.92.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.92.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.93.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.93.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.93.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.93.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.93.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.94.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.94.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.94.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.94.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.94.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.95.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.95.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.95.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.95.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.95.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.96.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.96.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.96.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.96.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.96.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.97.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.97.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.97.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.97.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.97.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.98.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.98.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.98.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.98.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.98.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.99.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.99.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.99.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.99.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.99.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.100.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.100.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.100.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.100.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.100.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.101.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.101.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.101.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.101.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.101.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.102.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.102.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.102.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.102.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.102.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.103.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.103.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.103.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.103.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.103.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.104.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.104.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.104.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.104.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.104.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.105.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.105.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.105.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.105.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.105.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.106.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.106.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.106.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.106.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.106.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.107.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.107.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.107.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.107.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.107.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.108.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.108.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.108.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.108.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.108.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.109.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.109.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.109.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.109.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.109.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.110.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.110.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.110.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.110.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.110.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.111.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.111.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.111.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.111.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.111.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.112.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.112.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.112.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.112.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.112.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.113.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.113.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.113.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.113.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.113.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.114.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.114.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.114.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.114.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.114.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.115.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.115.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.115.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.115.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.115.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.116.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.116.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.116.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.116.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.116.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.117.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.117.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.117.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.117.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.117.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.118.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.118.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.118.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.118.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.118.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.119.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.119.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.119.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.119.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.119.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.120.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.120.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.120.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.120.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.120.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.121.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.121.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.121.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.121.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.121.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.122.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.122.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.122.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.122.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.122.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.123.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.123.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.123.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.123.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.123.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.124.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.124.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.124.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.124.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.124.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.125.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.125.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.125.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.125.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.125.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.126.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.126.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.126.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.126.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.126.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.127.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.127.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.127.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.127.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.127.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.128.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.128.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.128.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.128.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.128.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.128.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.129.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.129.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.129.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.129.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.129.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.129.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.130.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.130.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.130.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.130.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.130.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.130.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.131.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.131.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.131.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.131.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.131.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.131.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.132.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.132.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.132.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.132.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.132.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.132.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.133.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.133.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.133.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.133.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.133.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.133.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.134.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.134.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.134.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.134.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.134.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.134.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.135.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.135.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.135.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.135.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.135.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.135.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.136.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.136.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.136.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.136.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.136.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.136.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.137.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.137.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.137.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.137.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.137.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.137.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.138.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.138.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.138.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.138.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.138.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.138.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.139.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.139.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.139.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.139.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.139.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.139.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.140.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.140.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.140.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.140.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.140.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.140.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.141.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.141.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.141.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.141.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.141.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.141.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.142.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.142.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.142.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.142.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.142.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.142.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.143.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.143.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.143.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.143.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.143.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.143.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.144.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.144.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.144.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.144.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.144.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.144.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.145.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.145.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.145.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.145.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.145.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.145.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.146.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.146.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.146.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.146.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.146.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.146.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.147.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.147.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.147.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.147.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.147.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.147.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.148.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.148.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.148.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.148.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.148.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.148.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.149.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.149.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.149.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.149.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.149.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.149.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.150.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.150.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.150.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.150.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.150.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.150.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.151.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.151.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.151.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.151.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.151.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.151.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.152.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.152.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.152.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.152.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.152.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.152.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.153.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.153.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.153.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.153.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.153.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.153.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.154.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.154.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.154.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.154.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.154.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.154.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.155.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.155.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.155.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.155.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.155.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.155.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.156.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.156.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.156.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.156.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.156.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.156.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.157.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.157.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.157.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.157.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.157.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.157.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.158.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.158.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.158.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.158.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.158.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.158.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.159.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.159.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.159.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.159.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.159.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.159.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.160.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.160.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.160.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.160.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.160.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.160.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.161.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.161.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.161.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.161.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.161.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.161.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.162.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.162.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.162.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.162.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.162.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.162.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.163.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.163.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.163.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.163.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.163.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.163.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.164.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.164.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.164.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.164.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.164.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.164.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.165.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.165.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.165.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.165.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.165.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.165.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.166.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.166.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.166.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.166.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.166.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.166.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.167.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.167.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.167.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.167.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.167.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.167.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.168.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.168.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.168.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.168.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.168.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.168.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.169.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.169.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.169.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.169.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.169.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.169.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.170.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.170.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.170.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.170.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.170.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.170.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.171.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.171.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.171.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.171.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.171.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.171.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.172.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.172.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.172.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.172.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.172.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.172.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.173.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.173.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.173.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.173.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.173.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.173.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.174.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.174.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.174.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.174.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.174.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.174.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.175.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.175.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.175.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.175.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.175.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.175.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.176.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.176.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.176.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.176.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.176.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.176.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.177.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.177.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.177.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.177.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.177.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.177.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.178.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.178.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.178.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.178.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.178.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.178.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.179.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.179.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.179.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.179.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.179.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.179.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.180.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.180.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.180.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.180.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.180.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.180.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.181.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.181.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.181.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.181.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.181.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.181.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.182.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.182.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.182.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.182.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.182.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.182.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.183.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.183.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.183.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.183.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.183.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.183.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.184.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.184.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.184.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.184.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.184.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.184.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.185.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.185.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.185.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.185.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.185.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.185.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.186.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.186.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.186.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.186.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.186.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.186.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.187.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.187.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.187.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.187.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.187.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.187.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.188.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.188.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.188.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.188.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.188.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.188.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.189.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.189.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.189.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.189.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.189.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.189.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.190.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.190.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.190.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.190.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.190.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.190.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.191.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.191.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.191.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.191.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.191.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.191.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.192.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.192.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.192.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.192.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.192.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.192.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.193.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.193.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.193.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.193.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.193.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.193.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.194.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.194.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.194.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.194.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.194.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.194.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.195.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.195.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.195.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.195.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.195.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.195.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.196.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.196.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.196.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.196.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.196.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.196.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.197.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.197.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.197.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.197.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.197.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.197.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.198.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.198.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.198.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.198.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.198.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.198.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.199.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.199.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.199.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.199.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.199.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.199.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.200.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.200.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.200.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.200.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.200.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.200.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.201.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.201.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.201.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.201.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.201.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.201.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.202.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.202.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.202.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.202.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.202.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.202.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.203.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.203.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.203.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.203.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.203.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.203.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.204.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.204.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.204.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.204.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.204.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.204.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.205.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.205.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.205.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.205.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.205.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.205.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.206.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.206.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.206.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.206.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.206.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.206.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.207.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.207.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.207.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.207.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.207.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.207.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.208.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.208.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.208.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.208.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.208.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.208.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.209.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.209.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.209.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.209.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.209.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.209.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.210.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.210.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.210.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.210.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.210.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.210.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.211.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.211.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.211.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.211.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.211.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.211.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.212.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.212.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.212.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.212.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.212.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.212.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.213.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.213.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.213.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.213.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.213.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.213.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.214.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.214.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.214.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.214.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.214.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.214.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.215.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.215.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.215.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.215.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.215.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.215.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.216.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.216.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.216.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.216.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.216.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.216.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.217.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.217.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.217.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.217.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.217.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.217.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.218.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.218.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.218.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.218.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.218.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.218.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.219.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.219.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.219.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.219.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.219.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.219.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.220.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.220.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.220.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.220.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.220.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.220.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.221.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.221.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.221.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.221.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.221.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.221.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.222.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.222.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.222.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.222.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.222.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.222.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.223.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.223.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.223.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.223.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.223.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.223.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.224.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.224.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.224.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.224.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.224.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.224.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.225.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.225.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.225.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.225.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.225.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.225.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.226.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.226.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.226.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.226.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.226.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.226.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.227.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.227.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.227.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.227.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.227.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.227.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.228.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.228.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.228.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.228.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.228.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.228.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.229.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.229.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.229.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.229.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.229.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.229.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.230.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.230.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.230.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.230.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.230.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.230.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.231.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.231.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.231.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.231.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.231.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.231.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.232.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.232.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.232.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.232.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.232.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.232.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.233.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.233.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.233.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.233.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.233.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.233.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.234.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.234.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.234.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.234.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.234.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.234.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.235.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.235.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.235.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.235.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.235.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.235.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.236.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.236.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.236.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.236.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.236.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.236.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.237.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.237.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.237.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.237.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.237.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.237.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.238.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.238.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.238.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.238.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.238.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.238.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.239.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.239.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.239.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.239.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.239.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.239.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.240.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.240.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.240.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.240.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.240.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.240.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.241.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.241.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.241.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.241.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.241.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.241.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.242.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.242.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.242.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.242.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.242.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.242.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.243.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.243.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.243.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.243.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.243.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.243.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.244.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.244.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.244.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.244.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.244.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.244.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.245.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.245.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.245.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.245.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.245.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.245.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.246.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.246.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.246.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.246.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.246.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.246.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.247.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.247.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.247.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.247.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.247.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.247.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.248.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.248.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.248.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.248.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.248.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.248.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.249.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.249.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.249.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.249.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.249.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.249.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.250.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.250.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.250.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.250.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.250.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.250.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.251.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.251.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.251.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.251.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.251.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.251.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.252.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.252.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.252.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.252.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.252.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.252.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.253.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.253.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.253.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.253.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.253.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.253.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.254.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.254.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.254.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.254.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.254.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.254.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.255.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.255.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.255.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.255.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.255.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.255.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.input_layernorm.weight": "model-00122-of-000163.safetensors", "model.layers.46.post_attention_layernorm.weight": "model-00122-of-000163.safetensors", "model.layers.47.self_attn.q_a_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.self_attn.q_a_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.self_attn.q_a_layernorm.weight": "model-00123-of-000163.safetensors", "model.layers.47.self_attn.q_b_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.self_attn.q_b_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.self_attn.kv_a_proj_with_mqa.weight": "model-00123-of-000163.safetensors", - "model.layers.47.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.self_attn.kv_a_layernorm.weight": "model-00123-of-000163.safetensors", "model.layers.47.self_attn.kv_b_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.self_attn.kv_b_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.self_attn.o_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.self_attn.o_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.gate.weight": "model-00123-of-000163.safetensors", "model.layers.47.mlp.gate.e_score_correction_bias": "model-00123-of-000163.safetensors", "model.layers.47.mlp.shared_experts.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.shared_experts.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.shared_experts.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.shared_experts.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.shared_experts.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.0.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.0.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.0.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.0.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.0.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.1.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.1.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.1.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.1.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.1.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.2.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.2.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.2.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.2.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.2.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.3.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.3.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.3.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.3.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.3.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.4.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.4.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.4.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.4.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.4.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.5.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.5.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.5.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.5.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.5.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.6.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.6.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.6.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.6.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.6.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.7.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.7.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.7.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.7.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.7.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.8.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.8.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.8.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.8.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.8.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.9.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.9.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.9.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.9.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.9.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.10.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.10.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.10.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.10.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.10.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.11.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.11.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.11.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.11.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.11.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.12.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.12.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.12.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.12.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.12.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.13.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.13.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.13.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.13.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.13.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.14.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.14.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.14.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.14.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.14.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.15.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.15.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.15.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.15.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.15.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.16.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.16.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.16.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.16.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.16.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.17.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.17.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.17.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.17.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.17.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.18.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.18.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.18.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.18.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.18.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.19.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.19.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.19.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.19.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.19.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.20.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.20.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.20.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.20.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.20.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.21.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.21.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.21.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.21.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.21.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.22.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.22.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.22.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.22.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.22.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.23.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.23.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.23.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.23.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.23.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.23.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.24.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.24.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.24.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.24.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.24.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.25.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.25.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.25.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.25.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.25.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.26.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.26.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.26.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.26.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.26.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.27.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.27.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.27.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.27.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.27.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.27.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.28.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.28.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.28.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.28.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.28.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.29.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.29.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.29.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.29.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.29.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.30.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.30.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.30.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.30.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.30.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.31.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.31.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.31.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.31.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.31.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.32.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.32.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.32.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.32.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.32.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.33.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.33.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.33.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.33.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.33.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.34.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.34.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.34.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.34.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.34.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.34.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.35.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.35.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.35.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.35.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.35.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.36.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.36.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.36.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.36.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.36.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.37.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.37.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.37.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.37.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.37.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.37.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.38.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.38.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.38.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.38.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.38.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.39.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.39.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.39.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.39.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.39.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.40.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.40.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.40.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.40.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.40.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.41.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.41.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.41.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.41.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.41.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.42.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.42.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.42.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.42.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.42.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.43.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.43.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.43.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.43.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.43.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.43.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.44.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.44.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.44.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.44.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.44.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.45.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.45.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.45.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.45.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.45.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.46.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.46.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.46.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.46.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.46.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.47.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.47.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.47.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.47.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.47.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.48.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.48.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.48.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.48.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.48.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.49.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.49.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.49.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.49.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.49.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.50.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.50.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.50.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.50.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.50.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.50.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.51.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.51.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.51.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.51.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.51.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.52.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.52.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.52.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.52.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.52.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.53.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.53.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.53.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.53.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.53.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.54.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.54.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.54.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.54.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.54.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.55.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.55.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.55.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.55.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.55.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.56.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.56.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.56.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.56.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.56.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.57.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.57.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.57.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.57.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.57.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.58.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.58.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.58.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.58.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.58.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.59.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.59.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.59.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.59.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.59.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.60.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.60.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.60.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.60.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.60.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.61.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.61.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.61.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.61.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.61.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.62.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.62.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.62.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.62.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.62.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.63.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.63.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.63.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.63.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.63.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.64.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.64.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.64.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.64.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.64.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.64.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.65.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.65.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.65.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.65.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.65.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.66.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.66.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.66.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.66.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.66.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.66.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.67.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.67.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.67.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.67.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.67.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.68.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.68.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.68.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.68.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.68.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.68.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.69.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.69.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.69.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.69.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.69.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.70.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.70.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.70.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.70.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.70.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.71.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.71.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.71.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.71.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.71.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.72.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.72.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.72.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.72.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.72.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.73.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.73.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.73.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.73.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.73.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.74.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.74.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.74.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.74.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.74.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.75.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.75.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.75.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.75.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.75.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.76.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.76.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.76.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.76.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.76.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.77.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.77.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.77.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.77.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.77.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.78.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.78.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.78.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.78.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.78.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.78.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.79.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.79.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.79.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.79.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.79.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.79.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.80.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.80.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.80.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.80.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.80.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.81.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.81.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.81.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.81.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.81.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.82.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.82.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.82.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.82.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.82.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.82.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.83.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.83.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.83.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.83.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.83.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.84.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.84.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.84.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.84.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.84.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.85.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.85.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.85.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.85.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.85.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.86.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.86.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.86.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.86.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.86.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.87.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.87.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.87.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.87.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.87.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.88.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.88.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.88.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.88.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.88.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.89.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.89.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.89.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.89.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.89.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.90.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.90.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.90.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.90.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.90.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.91.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.91.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.91.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.91.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.91.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.91.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.92.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.92.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.92.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.92.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.92.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.93.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.93.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.93.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.93.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.93.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.94.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.94.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.94.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.94.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.94.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.95.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.95.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.95.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.95.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.95.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.96.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.96.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.96.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.96.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.96.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.97.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.97.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.97.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.97.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.97.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.98.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.98.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.98.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.98.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.98.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.99.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.99.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.99.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.99.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.99.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.99.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.100.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.100.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.100.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.100.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.100.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.101.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.101.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.101.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.101.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.101.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.102.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.102.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.102.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.102.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.102.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.103.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.103.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.103.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.103.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.103.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.104.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.104.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.104.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.104.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.104.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.105.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.105.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.105.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.105.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.105.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.106.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.106.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.106.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.106.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.106.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.107.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.107.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.107.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.107.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.107.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.107.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.108.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.108.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.108.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.108.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.108.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.108.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.109.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.109.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.109.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.109.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.109.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.110.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.110.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.110.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.110.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.110.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.111.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.111.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.111.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.111.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.111.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.112.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.112.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.112.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.112.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.112.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.113.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.113.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.113.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.113.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.113.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.113.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.114.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.114.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.114.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.114.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.114.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.115.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.115.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.115.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.115.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.115.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.115.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.116.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.116.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.116.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.116.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.116.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.117.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.117.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.117.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.117.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.117.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.118.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.118.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.118.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.118.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.118.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.119.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.119.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.119.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.119.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.119.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.120.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.120.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.120.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.120.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.120.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.121.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.121.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.121.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.121.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.121.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.122.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.122.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.122.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.122.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.122.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.123.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.123.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.123.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.123.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.123.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.124.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.124.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.124.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.124.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.124.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.124.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.125.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.125.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.125.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.125.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.125.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.126.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.126.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.126.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.126.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.126.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.127.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.127.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.127.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.127.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.127.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.127.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.128.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.128.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.128.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.128.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.128.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.128.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.129.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.129.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.129.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.129.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.129.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.129.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.130.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.130.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.130.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.130.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.130.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.130.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.131.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.131.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.131.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.131.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.131.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.131.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.132.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.132.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.132.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.132.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.132.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.132.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.133.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.133.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.133.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.133.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.133.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.133.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.134.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.134.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.134.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.134.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.134.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.134.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.135.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.135.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.135.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.135.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.135.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.135.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.136.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.136.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.136.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.136.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.136.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.136.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.137.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.137.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.137.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.137.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.137.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.137.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.138.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.138.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.138.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.138.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.138.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.138.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.139.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.139.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.139.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.139.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.139.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.139.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.140.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.140.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.140.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.140.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.140.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.140.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.141.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.141.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.141.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.141.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.141.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.141.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.142.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.142.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.142.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.142.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.142.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.142.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.143.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.143.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.143.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.143.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.143.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.143.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.144.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.144.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.144.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.144.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.144.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.144.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.145.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.145.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.145.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.145.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.145.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.145.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.146.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.146.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.146.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.146.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.146.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.146.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.147.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.147.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.147.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.147.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.147.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.147.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.148.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.148.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.148.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.148.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.148.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.148.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.149.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.149.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.149.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.149.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.149.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.149.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.150.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.150.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.150.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.150.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.150.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.150.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.151.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.151.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.151.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.151.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.151.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.151.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.152.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.152.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.152.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.152.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.152.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.152.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.153.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.153.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.153.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.153.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.153.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.153.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.154.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.154.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.154.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.154.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.154.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.154.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.155.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.155.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.155.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.155.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.155.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.155.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.156.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.156.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.156.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.156.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.156.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.156.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.157.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.157.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.157.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.157.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.157.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.157.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.158.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.158.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.158.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.158.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.158.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.158.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.159.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.159.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.159.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.159.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.159.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.159.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.160.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.160.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.160.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.160.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.160.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.160.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.161.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.161.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.161.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.161.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.161.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.161.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.162.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.162.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.162.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.162.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.162.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.162.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.163.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.163.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.163.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.163.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.163.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.163.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.164.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.164.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.164.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.164.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.164.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.164.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.165.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.165.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.165.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.165.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.165.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.165.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.166.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.166.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.166.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.166.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.166.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.166.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.167.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.167.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.167.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.167.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.167.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.167.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.168.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.168.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.168.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.168.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.168.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.168.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.169.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.169.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.169.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.169.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.169.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.169.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.170.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.170.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.170.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.170.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.170.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.170.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.171.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.171.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.171.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.171.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.171.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.171.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.172.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.172.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.172.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.172.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.172.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.172.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.173.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.173.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.173.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.173.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.173.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.173.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.174.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.174.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.174.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.174.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.174.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.174.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.175.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.175.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.175.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.175.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.175.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.175.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.176.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.176.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.176.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.176.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.176.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.176.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.177.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.177.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.177.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.177.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.177.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.177.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.178.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.178.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.178.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.178.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.178.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.178.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.179.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.179.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.179.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.179.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.179.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.179.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.180.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.180.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.180.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.180.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.180.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.180.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.181.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.181.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.181.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.181.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.181.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.181.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.182.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.182.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.182.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.182.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.182.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.182.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.183.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.183.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.183.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.183.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.183.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.183.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.184.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.184.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.184.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.184.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.184.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.184.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.185.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.185.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.185.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.185.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.185.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.185.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.186.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.186.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.186.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.186.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.186.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.186.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.187.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.187.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.187.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.187.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.187.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.187.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.188.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.188.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.188.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.188.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.188.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.188.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.189.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.189.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.189.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.189.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.189.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.189.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.190.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.190.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.190.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.190.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.190.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.190.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.191.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.191.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.191.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.191.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.191.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.191.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.192.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.192.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.192.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.192.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.192.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.192.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.193.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.193.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.193.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.193.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.193.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.193.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.194.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.194.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.194.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.194.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.194.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.194.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.195.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.195.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.195.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.195.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.195.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.195.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.196.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.196.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.196.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.196.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.196.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.196.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.197.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.197.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.197.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.197.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.197.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.197.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.198.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.198.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.198.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.198.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.198.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.198.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.199.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.199.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.199.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.199.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.199.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.199.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.200.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.200.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.200.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.200.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.200.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.200.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.201.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.201.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.201.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.201.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.201.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.201.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.202.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.202.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.202.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.202.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.202.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.202.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.203.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.203.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.203.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.203.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.203.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.203.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.204.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.204.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.204.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.204.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.204.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.204.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.205.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.205.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.205.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.205.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.205.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.205.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.206.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.206.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.206.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.206.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.206.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.206.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.207.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.207.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.207.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.207.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.207.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.207.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.208.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.208.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.208.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.208.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.208.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.208.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.209.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.209.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.209.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.209.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.209.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.209.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.210.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.210.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.210.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.210.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.210.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.210.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.211.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.211.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.211.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.211.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.211.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.211.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.212.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.212.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.212.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.212.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.212.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.212.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.213.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.213.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.213.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.213.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.213.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.213.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.214.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.214.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.214.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.214.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.214.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.214.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.215.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.215.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.215.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.215.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.215.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.215.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.216.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.216.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.216.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.216.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.216.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.216.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.217.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.217.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.217.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.217.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.217.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.217.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.218.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.218.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.218.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.218.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.218.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.218.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.219.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.219.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.219.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.219.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.219.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.219.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.220.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.220.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.220.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.220.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.220.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.220.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.221.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.221.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.221.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.221.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.221.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.221.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.222.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.222.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.222.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.222.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.222.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.222.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.223.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.223.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.223.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.223.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.223.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.223.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.224.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.224.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.224.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.224.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.224.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.224.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.225.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.225.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.225.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.225.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.225.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.225.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.226.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.226.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.226.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.226.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.226.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.226.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.227.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.227.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.227.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.227.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.227.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.227.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.228.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.228.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.228.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.228.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.228.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.228.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.229.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.229.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.229.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.229.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.229.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.229.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.230.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.230.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.230.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.230.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.230.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.230.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.231.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.231.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.231.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.231.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.231.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.231.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.232.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.232.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.232.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.232.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.232.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.232.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.233.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.233.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.233.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.233.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.233.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.233.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.234.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.234.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.234.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.234.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.234.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.234.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.235.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.235.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.235.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.235.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.235.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.235.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.236.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.236.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.236.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.236.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.236.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.236.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.237.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.237.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.237.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.237.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.237.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.237.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.238.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.238.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.238.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.238.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.238.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.238.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.239.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.239.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.239.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.239.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.239.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.239.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.240.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.240.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.240.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.240.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.240.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.240.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.241.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.241.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.241.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.241.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.241.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.241.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.242.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.242.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.242.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.242.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.242.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.242.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.243.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.243.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.243.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.243.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.243.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.243.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.244.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.244.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.244.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.244.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.244.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.244.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.245.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.245.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.245.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.245.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.245.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.245.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.246.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.246.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.246.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.246.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.246.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.246.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.247.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.247.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.247.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.247.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.247.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.247.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.248.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.248.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.248.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.248.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.248.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.248.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.249.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.249.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.249.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.249.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.249.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.249.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.250.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.250.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.250.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.250.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.250.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.250.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.251.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.251.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.251.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.251.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.251.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.251.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.252.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.252.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.252.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.252.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.252.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.252.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.253.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.253.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.253.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.253.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.253.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.253.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.254.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.254.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.254.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.254.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.254.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.254.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.255.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.255.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.255.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.255.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.255.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.255.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.input_layernorm.weight": "model-00125-of-000163.safetensors", "model.layers.47.post_attention_layernorm.weight": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.q_a_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.self_attn.q_a_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.q_a_layernorm.weight": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.q_b_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.self_attn.q_b_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.kv_a_proj_with_mqa.weight": "model-00125-of-000163.safetensors", - "model.layers.48.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.kv_a_layernorm.weight": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.kv_b_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.self_attn.kv_b_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.o_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.self_attn.o_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.gate.weight": "model-00125-of-000163.safetensors", "model.layers.48.mlp.gate.e_score_correction_bias": "model-00125-of-000163.safetensors", "model.layers.48.mlp.shared_experts.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.shared_experts.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.shared_experts.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.shared_experts.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.shared_experts.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.0.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.0.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.0.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.0.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.0.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.1.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.1.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.1.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.1.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.1.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.2.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.2.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.2.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.2.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.2.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.3.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.3.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.3.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.3.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.3.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.4.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.4.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.4.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.4.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.4.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.5.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.5.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.5.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.5.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.5.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.5.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.6.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.6.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.6.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.6.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.6.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.7.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.7.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.7.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.7.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.7.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.7.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.8.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.8.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.8.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.8.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.8.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.9.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.9.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.9.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.9.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.9.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.10.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.10.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.10.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.10.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.10.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.10.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.11.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.11.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.11.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.11.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.11.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.12.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.12.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.12.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.12.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.12.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.13.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.13.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.13.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.13.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.13.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.14.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.14.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.14.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.14.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.14.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.15.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.15.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.15.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.15.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.15.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.16.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.16.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.16.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.16.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.16.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.17.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.17.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.17.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.17.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.17.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.18.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.18.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.18.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.18.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.18.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.19.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.19.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.19.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.19.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.19.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.20.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.20.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.20.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.20.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.20.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.21.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.21.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.21.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.21.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.21.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.22.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.22.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.22.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.22.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.22.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.22.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.23.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.23.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.23.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.23.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.23.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.24.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.24.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.24.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.24.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.24.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.25.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.25.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.25.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.25.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.25.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.26.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.26.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.26.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.26.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.26.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.27.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.27.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.27.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.27.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.27.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.28.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.28.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.28.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.28.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.28.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.29.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.29.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.29.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.29.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.29.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.30.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.30.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.30.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.30.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.30.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.31.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.31.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.31.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.31.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.31.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.31.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.32.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.32.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.32.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.32.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.32.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.33.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.33.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.33.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.33.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.33.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.34.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.34.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.34.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.34.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.34.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.35.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.35.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.35.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.35.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.35.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.36.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.36.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.36.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.36.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.36.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.36.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.37.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.37.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.37.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.37.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.37.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.38.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.38.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.38.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.38.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.38.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.39.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.39.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.39.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.39.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.39.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.40.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.40.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.40.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.40.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.40.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.41.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.41.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.41.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.41.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.41.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.42.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.42.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.42.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.42.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.42.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.43.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.43.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.43.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.43.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.43.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.44.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.44.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.44.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.44.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.44.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.44.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.45.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.45.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.45.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.45.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.45.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.46.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.46.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.46.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.46.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.46.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.47.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.47.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.47.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.47.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.47.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.48.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.48.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.48.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.48.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.48.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.48.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.49.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.49.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.49.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.49.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.49.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.50.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.50.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.50.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.50.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.50.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.51.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.51.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.51.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.51.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.51.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.52.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.52.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.52.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.52.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.52.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.53.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.53.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.53.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.53.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.53.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.54.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.54.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.54.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.54.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.54.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.55.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.55.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.55.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.55.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.55.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.55.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.56.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.56.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.56.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.56.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.56.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.57.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.57.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.57.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.57.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.57.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.58.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.58.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.58.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.58.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.58.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.59.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.59.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.59.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.59.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.59.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.60.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.60.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.60.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.60.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.60.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.61.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.61.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.61.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.61.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.61.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.62.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.62.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.62.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.62.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.62.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.63.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.63.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.63.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.63.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.63.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.63.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.64.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.64.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.64.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.64.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.64.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.64.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.65.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.65.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.65.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.65.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.65.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.66.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.66.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.66.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.66.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.66.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.67.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.67.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.67.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.67.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.67.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.68.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.68.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.68.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.68.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.68.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.69.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.69.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.69.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.69.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.69.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.70.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.70.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.70.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.70.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.70.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.71.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.71.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.71.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.71.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.71.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.72.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.72.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.72.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.72.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.72.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.73.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.73.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.73.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.73.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.73.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.74.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.74.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.74.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.74.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.74.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.75.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.75.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.75.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.75.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.75.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.76.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.76.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.76.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.76.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.76.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.77.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.77.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.77.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.77.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.77.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.77.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.78.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.78.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.78.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.78.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.78.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.79.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.79.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.79.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.79.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.79.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.80.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.80.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.80.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.80.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.80.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.81.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.81.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.81.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.81.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.81.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.82.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.82.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.82.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.82.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.82.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.83.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.83.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.83.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.83.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.83.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.84.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.84.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.84.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.84.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.84.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.85.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.85.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.85.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.85.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.85.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.86.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.86.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.86.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.86.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.86.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.87.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.87.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.87.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.87.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.87.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.88.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.88.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.88.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.88.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.88.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.89.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.89.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.89.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.89.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.89.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.89.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.90.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.90.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.90.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.90.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.90.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.90.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.91.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.91.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.91.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.91.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.91.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.92.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.92.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.92.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.92.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.92.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.93.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.93.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.93.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.93.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.93.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.94.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.94.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.94.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.94.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.94.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.95.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.95.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.95.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.95.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.95.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.96.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.96.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.96.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.96.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.96.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.97.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.97.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.97.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.97.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.97.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.97.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.98.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.98.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.98.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.98.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.98.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.99.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.99.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.99.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.99.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.99.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.100.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.100.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.100.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.100.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.100.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.100.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.101.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.101.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.101.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.101.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.101.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.102.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.102.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.102.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.102.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.102.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.103.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.103.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.103.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.103.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.103.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.104.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.104.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.104.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.104.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.104.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.105.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.105.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.105.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.105.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.105.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.106.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.106.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.106.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.106.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.106.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.106.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.107.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.107.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.107.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.107.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.107.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.108.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.108.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.108.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.108.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.108.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.109.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.109.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.109.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.109.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.109.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.110.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.110.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.110.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.110.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.110.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.111.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.111.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.111.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.111.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.111.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.112.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.112.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.112.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.112.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.112.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.112.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.113.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.113.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.113.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.113.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.113.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.113.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.114.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.114.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.114.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.114.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.114.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.115.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.115.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.115.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.115.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.115.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.116.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.116.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.116.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.116.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.116.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.117.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.117.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.117.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.117.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.117.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.118.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.118.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.118.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.118.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.118.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.119.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.119.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.119.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.119.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.119.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.120.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.120.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.120.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.120.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.120.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.121.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.121.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.121.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.121.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.121.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.122.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.122.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.122.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.122.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.122.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.123.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.123.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.123.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.123.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.123.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.124.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.124.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.124.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.124.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.124.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.125.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.125.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.125.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.125.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.125.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.126.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.126.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.126.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.126.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.126.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.126.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.127.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.127.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.127.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.127.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.127.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.128.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.128.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.128.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.128.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.128.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.128.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.129.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.129.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.129.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.129.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.129.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.129.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.130.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.130.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.130.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.130.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.130.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.130.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.131.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.131.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.131.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.131.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.131.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.131.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.132.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.132.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.132.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.132.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.132.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.132.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.133.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.133.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.133.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.133.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.133.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.133.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.134.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.134.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.134.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.134.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.134.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.134.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.135.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.135.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.135.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.135.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.135.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.135.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.136.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.136.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.136.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.136.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.136.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.136.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.137.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.137.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.137.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.137.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.137.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.137.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.138.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.138.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.138.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.138.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.138.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.138.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.139.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.139.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.139.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.139.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.139.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.139.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.140.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.140.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.140.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.140.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.140.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.140.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.141.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.141.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.141.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.141.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.141.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.141.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.142.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.142.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.142.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.142.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.142.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.142.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.143.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.143.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.143.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.143.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.143.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.143.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.144.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.144.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.144.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.144.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.144.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.144.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.145.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.145.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.145.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.145.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.145.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.145.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.146.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.146.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.146.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.146.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.146.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.146.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.147.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.147.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.147.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.147.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.147.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.147.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.148.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.148.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.148.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.148.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.148.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.148.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.149.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.149.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.149.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.149.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.149.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.149.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.150.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.150.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.150.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.150.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.150.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.150.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.151.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.151.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.151.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.151.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.151.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.151.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.152.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.152.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.152.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.152.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.152.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.152.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.153.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.153.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.153.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.153.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.153.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.153.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.154.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.154.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.154.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.154.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.154.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.154.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.155.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.155.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.155.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.155.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.155.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.155.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.156.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.156.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.156.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.156.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.156.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.156.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.157.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.157.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.157.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.157.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.157.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.157.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.158.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.158.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.158.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.158.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.158.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.158.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.159.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.159.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.159.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.159.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.159.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.159.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.160.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.160.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.160.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.160.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.160.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.160.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.161.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.161.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.161.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.161.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.161.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.161.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.162.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.162.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.162.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.162.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.162.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.162.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.163.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.163.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.163.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.163.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.163.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.163.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.164.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.164.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.164.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.164.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.164.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.164.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.165.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.165.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.165.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.165.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.165.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.165.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.166.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.166.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.166.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.166.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.166.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.166.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.167.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.167.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.167.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.167.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.167.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.167.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.168.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.168.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.168.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.168.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.168.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.168.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.169.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.169.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.169.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.169.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.169.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.169.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.170.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.170.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.170.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.170.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.170.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.170.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.171.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.171.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.171.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.171.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.171.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.171.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.172.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.172.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.172.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.172.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.172.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.172.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.173.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.173.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.173.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.173.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.173.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.173.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.174.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.174.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.174.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.174.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.174.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.174.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.175.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.175.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.175.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.175.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.175.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.175.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.176.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.176.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.176.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.176.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.176.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.176.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.177.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.177.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.177.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.177.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.177.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.177.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.178.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.178.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.178.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.178.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.178.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.178.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.179.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.179.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.179.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.179.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.179.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.179.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.180.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.180.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.180.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.180.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.180.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.180.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.181.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.181.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.181.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.181.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.181.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.181.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.182.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.182.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.182.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.182.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.182.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.182.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.183.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.183.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.183.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.183.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.183.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.183.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.184.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.184.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.184.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.184.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.184.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.184.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.185.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.185.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.185.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.185.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.185.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.185.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.186.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.186.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.186.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.186.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.186.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.186.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.187.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.187.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.187.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.187.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.187.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.187.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.188.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.188.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.188.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.188.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.188.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.188.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.189.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.189.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.189.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.189.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.189.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.189.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.190.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.190.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.190.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.190.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.190.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.190.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.191.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.191.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.191.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.191.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.191.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.191.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.192.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.192.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.192.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.192.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.192.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.192.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.193.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.193.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.193.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.193.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.193.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.193.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.194.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.194.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.194.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.194.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.194.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.194.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.195.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.195.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.195.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.195.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.195.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.195.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.196.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.196.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.196.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.196.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.196.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.196.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.197.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.197.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.197.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.197.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.197.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.197.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.198.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.198.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.198.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.198.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.198.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.198.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.199.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.199.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.199.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.199.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.199.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.199.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.200.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.200.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.200.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.200.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.200.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.200.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.201.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.201.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.201.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.201.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.201.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.201.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.202.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.202.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.202.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.202.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.202.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.202.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.203.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.203.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.203.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.203.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.203.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.203.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.204.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.204.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.204.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.204.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.204.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.204.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.205.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.205.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.205.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.205.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.205.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.205.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.206.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.206.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.206.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.206.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.206.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.206.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.207.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.207.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.207.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.207.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.207.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.207.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.208.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.208.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.208.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.208.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.208.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.208.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.209.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.209.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.209.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.209.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.209.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.209.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.210.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.210.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.210.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.210.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.210.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.210.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.211.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.211.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.211.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.211.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.211.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.211.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.212.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.212.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.212.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.212.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.212.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.212.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.213.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.213.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.213.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.213.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.213.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.213.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.214.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.214.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.214.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.214.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.214.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.214.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.215.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.215.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.215.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.215.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.215.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.215.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.216.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.216.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.216.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.216.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.216.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.216.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.217.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.217.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.217.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.217.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.217.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.217.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.218.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.218.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.218.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.218.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.218.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.218.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.219.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.219.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.219.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.219.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.219.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.219.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.220.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.220.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.220.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.220.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.220.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.220.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.221.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.221.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.221.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.221.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.221.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.221.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.222.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.222.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.222.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.222.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.222.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.222.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.223.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.223.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.223.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.223.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.223.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.223.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.224.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.224.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.224.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.224.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.224.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.224.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.225.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.225.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.225.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.225.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.225.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.225.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.226.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.226.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.226.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.226.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.226.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.226.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.227.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.227.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.227.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.227.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.227.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.227.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.228.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.228.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.228.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.228.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.228.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.228.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.229.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.229.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.229.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.229.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.229.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.229.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.230.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.230.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.230.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.230.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.230.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.230.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.231.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.231.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.231.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.231.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.231.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.231.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.232.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.232.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.232.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.232.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.232.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.232.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.233.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.233.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.233.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.233.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.233.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.233.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.234.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.234.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.234.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.234.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.234.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.234.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.235.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.235.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.235.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.235.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.235.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.235.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.236.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.236.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.236.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.236.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.236.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.236.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.237.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.237.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.237.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.237.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.237.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.237.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.238.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.238.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.238.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.238.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.238.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.238.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.239.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.239.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.239.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.239.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.239.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.239.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.240.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.240.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.240.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.240.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.240.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.240.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.241.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.241.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.241.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.241.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.241.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.241.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.242.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.242.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.242.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.242.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.242.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.242.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.243.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.243.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.243.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.243.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.243.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.243.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.244.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.244.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.244.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.244.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.244.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.244.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.245.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.245.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.245.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.245.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.245.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.245.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.246.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.246.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.246.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.246.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.246.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.246.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.247.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.247.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.247.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.247.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.247.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.247.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.248.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.248.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.248.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.248.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.248.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.248.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.249.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.249.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.249.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.249.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.249.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.249.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.250.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.250.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.250.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.250.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.250.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.250.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.251.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.251.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.251.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.251.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.251.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.251.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.252.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.252.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.252.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.252.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.252.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.252.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.253.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.253.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.253.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.253.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.253.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.253.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.254.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.254.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.254.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.254.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.254.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.254.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.255.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.255.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.255.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.255.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.255.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.255.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.input_layernorm.weight": "model-00128-of-000163.safetensors", "model.layers.48.post_attention_layernorm.weight": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.q_a_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.self_attn.q_a_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.q_a_layernorm.weight": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.q_b_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.self_attn.q_b_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.kv_a_proj_with_mqa.weight": "model-00128-of-000163.safetensors", - "model.layers.49.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.kv_a_layernorm.weight": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.kv_b_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.self_attn.kv_b_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.o_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.self_attn.o_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.gate.weight": "model-00128-of-000163.safetensors", "model.layers.49.mlp.gate.e_score_correction_bias": "model-00128-of-000163.safetensors", "model.layers.49.mlp.shared_experts.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.shared_experts.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.shared_experts.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.shared_experts.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.shared_experts.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.0.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.0.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.0.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.0.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.0.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.1.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.1.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.1.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.1.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.1.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.2.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.2.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.2.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.2.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.2.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.3.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.3.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.3.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.3.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.3.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.3.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.4.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.4.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.4.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.4.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.4.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.5.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.5.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.5.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.5.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.5.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.6.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.6.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.6.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.6.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.6.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.7.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.7.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.7.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.7.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.7.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.8.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.8.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.8.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.8.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.8.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.8.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.9.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.9.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.9.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.9.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.9.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.9.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.10.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.10.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.10.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.10.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.10.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.10.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.11.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.11.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.11.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.11.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.11.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.11.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.12.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.12.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.12.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.12.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.12.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.12.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.13.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.13.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.13.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.13.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.13.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.13.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.14.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.14.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.14.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.14.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.14.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.14.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.15.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.15.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.15.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.15.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.15.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.15.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.16.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.16.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.16.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.16.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.16.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.16.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.17.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.17.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.17.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.17.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.17.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.17.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.18.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.18.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.18.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.18.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.18.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.18.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.19.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.19.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.19.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.19.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.19.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.19.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.20.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.20.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.20.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.20.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.20.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.20.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.21.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.21.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.21.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.21.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.21.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.21.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.22.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.22.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.22.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.22.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.22.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.22.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.23.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.23.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.23.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.23.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.23.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.23.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.24.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.24.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.24.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.24.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.24.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.24.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.25.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.25.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.25.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.25.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.25.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.25.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.26.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.26.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.26.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.26.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.26.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.26.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.27.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.27.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.27.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.27.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.27.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.27.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.28.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.28.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.28.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.28.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.28.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.28.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.29.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.29.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.29.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.29.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.29.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.29.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.30.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.30.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.30.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.30.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.30.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.30.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.31.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.31.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.31.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.31.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.31.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.31.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.32.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.32.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.32.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.32.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.32.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.32.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.33.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.33.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.33.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.33.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.33.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.33.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.34.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.34.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.34.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.34.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.34.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.34.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.35.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.35.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.35.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.35.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.35.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.35.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.36.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.36.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.36.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.36.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.36.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.36.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.37.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.37.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.37.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.37.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.37.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.37.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.38.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.38.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.38.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.38.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.38.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.38.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.39.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.39.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.39.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.39.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.39.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.39.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.40.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.40.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.40.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.40.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.40.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.40.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.41.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.41.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.41.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.41.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.41.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.41.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.42.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.42.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.42.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.42.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.42.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.42.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.43.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.43.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.43.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.43.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.43.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.43.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.44.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.44.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.44.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.44.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.44.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.44.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.45.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.45.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.45.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.45.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.45.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.45.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.46.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.46.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.46.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.46.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.46.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.46.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.47.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.47.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.47.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.47.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.47.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.47.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.48.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.48.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.48.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.48.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.48.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.48.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.49.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.49.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.49.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.49.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.49.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.49.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.50.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.50.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.50.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.50.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.50.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.50.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.51.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.51.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.51.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.51.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.51.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.51.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.52.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.52.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.52.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.52.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.52.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.52.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.53.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.53.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.53.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.53.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.53.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.53.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.54.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.54.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.54.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.54.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.54.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.54.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.55.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.55.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.55.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.55.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.55.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.55.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.56.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.56.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.56.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.56.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.56.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.56.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.57.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.57.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.57.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.57.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.57.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.57.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.58.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.58.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.58.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.58.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.58.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.58.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.59.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.59.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.59.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.59.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.59.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.59.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.60.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.60.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.60.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.60.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.60.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.60.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.61.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.61.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.61.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.61.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.61.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.61.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.62.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.62.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.62.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.62.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.62.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.62.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.63.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.63.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.63.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.63.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.63.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.63.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.64.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.64.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.64.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.64.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.64.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.64.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.65.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.65.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.65.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.65.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.65.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.65.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.66.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.66.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.66.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.66.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.66.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.66.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.67.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.67.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.67.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.67.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.67.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.67.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.68.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.68.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.68.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.68.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.68.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.68.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.69.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.69.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.69.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.69.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.69.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.69.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.70.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.70.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.70.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.70.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.70.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.70.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.71.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.71.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.71.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.71.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.71.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.71.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.72.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.72.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.72.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.72.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.72.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.72.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.73.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.73.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.73.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.73.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.73.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.73.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.74.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.74.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.74.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.74.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.74.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.74.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.75.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.75.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.75.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.75.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.75.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.75.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.76.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.76.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.76.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.76.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.76.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.76.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.77.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.77.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.77.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.77.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.77.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.77.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.78.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.78.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.78.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.78.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.78.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.78.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.79.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.79.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.79.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.79.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.79.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.79.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.80.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.80.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.80.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.80.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.80.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.80.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.81.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.81.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.81.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.81.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.81.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.81.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.82.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.82.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.82.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.82.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.82.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.82.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.83.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.83.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.83.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.83.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.83.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.83.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.84.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.84.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.84.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.84.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.84.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.84.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.85.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.85.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.85.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.85.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.85.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.85.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.86.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.86.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.86.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.86.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.86.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.86.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.87.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.87.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.87.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.87.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.87.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.87.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.88.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.88.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.88.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.88.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.88.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.88.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.89.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.89.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.89.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.89.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.89.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.89.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.90.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.90.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.90.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.90.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.90.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.90.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.91.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.91.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.91.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.91.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.91.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.91.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.92.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.92.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.92.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.92.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.92.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.92.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.93.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.93.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.93.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.93.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.93.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.93.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.94.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.94.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.94.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.94.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.94.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.94.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.95.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.95.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.95.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.95.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.95.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.95.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.96.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.96.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.96.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.96.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.96.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.96.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.97.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.97.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.97.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.97.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.97.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.97.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.98.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.98.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.98.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.98.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.98.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.98.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.99.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.99.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.99.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.99.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.99.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.99.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.100.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.100.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.100.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.100.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.100.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.100.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.101.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.101.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.101.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.101.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.101.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.101.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.102.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.102.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.102.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.102.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.102.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.102.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.103.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.103.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.103.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.103.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.103.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.103.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.104.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.104.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.104.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.104.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.104.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.104.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.105.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.105.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.105.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.105.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.105.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.105.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.106.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.106.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.106.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.106.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.106.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.106.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.107.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.107.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.107.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.107.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.107.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.107.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.108.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.108.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.108.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.108.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.108.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.108.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.109.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.109.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.109.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.109.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.109.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.109.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.110.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.110.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.110.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.110.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.110.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.110.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.111.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.111.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.111.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.111.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.111.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.111.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.112.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.112.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.112.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.112.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.112.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.112.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.113.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.113.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.113.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.113.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.113.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.113.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.114.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.114.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.114.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.114.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.114.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.114.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.115.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.115.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.115.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.115.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.115.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.115.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.116.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.116.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.116.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.116.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.116.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.116.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.117.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.117.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.117.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.117.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.117.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.117.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.118.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.118.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.118.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.118.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.118.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.118.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.119.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.119.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.119.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.119.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.119.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.119.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.120.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.120.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.120.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.120.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.120.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.120.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.121.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.121.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.121.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.121.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.121.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.121.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.122.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.122.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.122.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.122.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.122.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.122.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.123.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.123.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.123.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.123.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.123.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.123.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.124.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.124.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.124.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.124.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.124.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.124.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.125.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.125.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.125.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.125.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.125.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.125.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.126.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.126.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.126.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.126.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.126.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.126.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.127.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.127.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.127.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.127.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.127.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.127.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.128.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.128.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.128.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.128.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.128.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.128.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.129.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.129.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.129.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.129.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.129.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.129.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.130.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.130.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.130.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.130.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.130.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.130.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.131.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.131.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.131.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.131.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.131.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.131.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.132.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.132.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.132.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.132.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.132.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.132.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.133.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.133.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.133.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.133.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.133.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.133.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.134.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.134.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.134.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.134.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.134.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.134.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.135.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.135.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.135.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.135.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.135.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.135.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.136.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.136.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.136.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.136.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.136.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.136.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.137.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.137.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.137.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.137.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.137.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.137.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.138.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.138.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.138.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.138.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.138.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.138.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.139.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.139.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.139.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.139.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.139.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.139.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.140.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.140.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.140.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.140.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.140.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.140.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.141.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.141.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.141.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.141.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.141.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.141.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.142.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.142.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.142.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.142.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.142.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.142.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.143.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.143.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.143.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.143.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.143.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.143.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.144.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.144.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.144.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.144.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.144.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.144.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.145.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.145.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.145.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.145.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.145.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.145.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.146.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.146.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.146.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.146.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.146.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.146.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.147.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.147.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.147.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.147.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.147.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.147.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.148.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.148.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.148.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.148.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.148.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.148.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.149.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.149.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.149.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.149.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.149.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.149.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.150.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.150.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.150.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.150.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.150.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.150.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.151.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.151.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.151.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.151.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.151.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.151.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.152.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.152.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.152.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.152.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.152.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.152.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.153.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.153.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.153.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.153.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.153.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.153.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.154.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.154.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.154.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.154.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.154.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.154.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.155.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.155.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.155.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.155.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.155.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.155.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.156.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.156.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.156.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.156.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.156.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.156.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.157.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.157.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.157.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.157.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.157.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.157.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.158.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.158.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.158.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.158.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.158.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.158.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.159.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.159.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.159.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.159.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.159.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.159.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.160.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.160.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.160.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.160.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.160.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.160.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.161.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.161.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.161.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.161.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.161.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.161.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.162.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.162.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.162.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.162.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.162.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.162.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.163.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.163.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.163.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.163.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.163.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.163.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.164.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.164.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.164.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.164.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.164.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.164.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.165.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.165.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.165.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.165.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.165.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.165.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.166.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.166.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.166.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.166.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.166.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.166.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.167.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.167.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.167.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.167.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.167.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.167.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.168.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.168.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.168.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.168.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.168.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.168.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.169.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.169.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.169.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.169.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.169.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.169.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.170.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.170.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.170.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.170.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.170.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.170.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.171.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.171.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.171.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.171.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.171.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.171.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.172.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.172.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.172.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.172.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.172.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.172.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.173.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.173.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.173.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.173.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.173.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.173.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.174.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.174.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.174.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.174.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.174.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.174.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.175.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.175.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.175.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.175.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.175.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.175.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.176.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.176.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.176.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.176.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.176.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.176.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.177.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.177.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.177.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.177.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.177.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.177.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.178.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.178.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.178.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.178.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.178.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.178.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.179.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.179.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.179.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.179.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.179.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.179.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.180.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.180.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.180.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.180.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.180.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.180.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.181.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.181.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.181.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.181.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.181.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.181.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.182.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.182.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.182.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.182.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.182.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.182.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.183.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.183.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.183.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.183.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.183.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.183.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.184.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.184.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.184.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.184.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.184.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.184.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.185.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.185.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.185.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.185.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.185.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.185.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.186.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.186.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.186.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.186.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.186.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.186.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.187.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.187.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.187.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.187.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.187.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.187.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.188.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.188.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.188.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.188.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.188.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.188.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.189.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.189.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.189.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.189.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.189.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.189.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.190.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.190.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.190.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.190.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.190.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.190.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.191.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.191.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.191.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.191.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.191.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.191.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.192.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.192.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.192.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.192.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.192.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.192.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.193.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.193.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.193.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.193.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.193.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.193.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.194.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.194.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.194.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.194.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.194.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.194.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.195.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.195.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.195.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.195.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.195.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.195.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.196.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.196.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.196.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.196.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.196.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.196.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.197.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.197.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.197.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.197.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.197.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.197.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.198.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.198.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.198.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.198.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.198.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.198.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.199.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.199.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.199.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.199.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.199.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.199.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.200.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.200.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.200.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.200.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.200.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.200.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.201.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.201.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.201.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.201.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.201.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.201.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.202.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.202.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.202.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.202.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.202.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.202.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.203.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.203.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.203.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.203.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.203.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.203.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.204.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.204.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.204.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.204.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.204.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.204.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.205.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.205.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.205.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.205.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.205.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.205.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.206.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.206.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.206.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.206.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.206.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.206.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.207.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.207.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.207.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.207.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.207.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.207.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.208.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.208.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.208.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.208.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.208.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.208.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.209.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.209.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.209.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.209.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.209.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.209.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.210.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.210.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.210.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.210.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.210.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.210.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.211.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.211.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.211.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.211.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.211.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.211.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.212.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.212.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.212.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.212.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.212.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.212.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.213.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.213.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.213.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.213.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.213.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.213.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.214.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.214.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.214.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.214.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.214.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.214.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.215.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.215.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.215.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.215.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.215.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.215.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.216.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.216.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.216.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.216.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.216.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.216.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.217.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.217.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.217.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.217.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.217.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.217.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.218.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.218.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.218.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.218.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.218.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.218.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.219.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.219.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.219.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.219.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.219.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.219.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.220.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.220.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.220.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.220.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.220.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.220.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.221.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.221.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.221.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.221.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.221.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.221.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.222.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.222.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.222.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.222.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.222.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.222.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.223.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.223.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.223.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.223.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.223.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.223.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.224.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.224.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.224.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.224.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.224.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.224.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.225.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.225.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.225.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.225.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.225.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.225.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.226.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.226.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.226.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.226.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.226.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.226.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.227.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.227.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.227.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.227.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.227.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.227.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.228.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.228.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.228.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.228.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.228.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.228.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.229.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.229.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.229.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.229.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.229.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.229.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.230.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.230.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.230.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.230.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.230.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.230.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.231.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.231.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.231.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.231.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.231.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.231.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.232.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.232.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.232.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.232.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.232.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.232.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.233.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.233.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.233.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.233.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.233.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.233.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.234.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.234.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.234.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.234.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.234.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.234.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.235.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.235.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.235.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.235.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.235.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.235.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.236.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.236.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.236.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.236.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.236.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.236.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.237.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.237.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.237.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.237.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.237.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.237.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.238.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.238.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.238.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.238.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.238.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.238.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.239.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.239.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.239.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.239.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.239.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.239.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.240.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.240.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.240.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.240.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.240.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.240.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.241.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.241.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.241.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.241.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.241.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.241.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.242.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.242.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.242.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.242.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.242.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.242.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.243.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.243.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.243.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.243.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.243.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.243.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.244.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.244.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.244.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.244.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.244.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.244.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.245.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.245.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.245.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.245.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.245.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.245.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.246.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.246.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.246.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.246.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.246.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.246.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.247.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.247.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.247.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.247.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.247.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.247.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.248.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.248.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.248.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.248.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.248.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.248.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.249.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.249.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.249.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.249.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.249.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.249.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.250.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.250.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.250.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.250.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.250.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.250.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.251.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.251.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.251.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.251.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.251.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.251.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.252.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.252.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.252.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.252.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.252.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.252.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.253.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.253.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.253.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.253.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.253.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.253.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.254.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.254.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.254.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.254.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.254.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.254.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.255.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.255.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.255.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.255.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.255.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.255.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.input_layernorm.weight": "model-00131-of-000163.safetensors", "model.layers.49.post_attention_layernorm.weight": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.q_a_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.self_attn.q_a_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.q_a_layernorm.weight": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.q_b_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.self_attn.q_b_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.kv_a_proj_with_mqa.weight": "model-00131-of-000163.safetensors", - "model.layers.50.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.kv_a_layernorm.weight": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.kv_b_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.self_attn.kv_b_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.o_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.self_attn.o_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.gate.weight": "model-00131-of-000163.safetensors", "model.layers.50.mlp.gate.e_score_correction_bias": "model-00131-of-000163.safetensors", "model.layers.50.mlp.shared_experts.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.shared_experts.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.shared_experts.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.shared_experts.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.shared_experts.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.0.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.0.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.0.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.0.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.0.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.0.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.1.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.1.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.1.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.1.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.1.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.1.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.2.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.2.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.2.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.2.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.2.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.2.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.3.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.3.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.3.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.3.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.3.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.3.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.4.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.4.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.4.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.4.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.4.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.4.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.5.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.5.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.5.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.5.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.5.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.5.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.6.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.6.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.6.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.6.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.6.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.6.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.7.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.7.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.7.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.7.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.7.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.7.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.8.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.8.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.8.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.8.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.8.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.8.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.9.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.9.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.9.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.9.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.9.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.9.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.10.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.10.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.10.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.10.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.10.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.10.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.11.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.11.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.11.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.11.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.11.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.11.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.12.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.12.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.12.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.12.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.12.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.12.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.13.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.13.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.13.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.13.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.13.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.13.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.14.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.14.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.14.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.14.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.14.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.14.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.15.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.15.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.15.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.15.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.15.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.15.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.16.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.16.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.16.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.16.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.16.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.16.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.17.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.17.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.17.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.17.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.17.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.17.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.18.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.18.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.18.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.18.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.18.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.18.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.19.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.19.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.19.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.19.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.19.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.19.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.20.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.20.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.20.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.20.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.20.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.20.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.21.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.21.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.21.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.21.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.21.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.21.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.22.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.22.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.22.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.22.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.22.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.22.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.23.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.23.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.23.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.23.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.23.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.23.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.24.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.24.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.24.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.24.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.24.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.24.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.25.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.25.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.25.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.25.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.25.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.25.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.26.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.26.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.26.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.26.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.26.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.26.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.27.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.27.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.27.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.27.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.27.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.27.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.28.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.28.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.28.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.28.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.28.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.28.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.29.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.29.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.29.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.29.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.29.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.29.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.30.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.30.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.30.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.30.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.30.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.30.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.31.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.31.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.31.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.31.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.31.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.31.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.32.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.32.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.32.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.32.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.32.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.32.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.33.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.33.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.33.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.33.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.33.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.33.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.34.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.34.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.34.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.34.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.34.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.34.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.35.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.35.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.35.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.35.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.35.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.35.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.36.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.36.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.36.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.36.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.36.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.36.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.37.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.37.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.37.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.37.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.37.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.37.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.38.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.38.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.38.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.38.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.38.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.38.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.39.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.39.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.39.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.39.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.39.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.39.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.40.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.40.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.40.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.40.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.40.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.40.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.41.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.41.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.41.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.41.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.41.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.41.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.42.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.42.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.42.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.42.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.42.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.42.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.43.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.43.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.43.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.43.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.43.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.43.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.44.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.44.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.44.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.44.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.44.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.44.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.45.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.45.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.45.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.45.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.45.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.45.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.46.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.46.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.46.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.46.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.46.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.46.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.47.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.47.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.47.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.47.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.47.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.47.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.48.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.48.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.48.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.48.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.48.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.48.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.49.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.49.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.49.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.49.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.49.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.49.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.50.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.50.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.50.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.50.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.50.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.50.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.51.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.51.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.51.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.51.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.51.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.51.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.52.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.52.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.52.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.52.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.52.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.52.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.53.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.53.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.53.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.53.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.53.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.53.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.54.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.54.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.54.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.54.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.54.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.54.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.55.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.55.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.55.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.55.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.55.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.55.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.56.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.56.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.56.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.56.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.56.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.56.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.57.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.57.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.57.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.57.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.57.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.57.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.58.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.58.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.58.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.58.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.58.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.58.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.59.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.59.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.59.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.59.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.59.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.59.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.60.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.60.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.60.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.60.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.60.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.60.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.61.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.61.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.61.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.61.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.61.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.61.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.62.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.62.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.62.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.62.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.62.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.62.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.63.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.63.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.63.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.63.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.63.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.63.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.64.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.64.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.64.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.64.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.64.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.64.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.65.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.65.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.65.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.65.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.65.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.65.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.66.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.66.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.66.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.66.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.66.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.66.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.67.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.67.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.67.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.67.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.67.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.67.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.68.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.68.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.68.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.68.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.68.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.68.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.69.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.69.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.69.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.69.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.69.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.69.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.70.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.70.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.70.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.70.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.70.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.70.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.71.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.71.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.71.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.71.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.71.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.71.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.72.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.72.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.72.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.72.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.72.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.72.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.73.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.73.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.73.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.73.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.73.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.73.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.74.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.74.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.74.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.74.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.74.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.74.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.75.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.75.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.75.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.75.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.75.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.75.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.76.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.76.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.76.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.76.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.76.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.76.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.77.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.77.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.77.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.77.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.77.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.77.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.78.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.78.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.78.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.78.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.78.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.78.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.79.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.79.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.79.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.79.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.79.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.79.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.80.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.80.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.80.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.80.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.80.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.80.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.81.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.81.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.81.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.81.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.81.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.81.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.82.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.82.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.82.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.82.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.82.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.82.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.83.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.83.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.83.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.83.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.83.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.83.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.84.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.84.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.84.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.84.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.84.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.84.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.85.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.85.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.85.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.85.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.85.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.85.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.86.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.86.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.86.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.86.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.86.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.86.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.87.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.87.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.87.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.87.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.87.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.87.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.88.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.88.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.88.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.88.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.88.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.88.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.89.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.89.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.89.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.89.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.89.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.89.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.90.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.90.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.90.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.90.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.90.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.90.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.91.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.91.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.91.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.91.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.91.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.91.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.92.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.92.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.92.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.92.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.92.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.92.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.93.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.93.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.93.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.93.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.93.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.93.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.94.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.94.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.94.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.94.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.94.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.94.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.95.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.95.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.95.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.95.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.95.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.95.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.96.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.96.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.96.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.96.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.96.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.96.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.97.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.97.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.97.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.97.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.97.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.97.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.98.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.98.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.98.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.98.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.98.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.98.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.99.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.99.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.99.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.99.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.99.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.99.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.100.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.100.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.100.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.100.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.100.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.100.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.101.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.101.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.101.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.101.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.101.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.101.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.102.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.102.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.102.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.102.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.102.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.102.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.103.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.103.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.103.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.103.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.103.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.103.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.104.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.104.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.104.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.104.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.104.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.104.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.105.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.105.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.105.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.105.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.105.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.105.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.106.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.106.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.106.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.106.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.106.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.106.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.107.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.107.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.107.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.107.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.107.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.107.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.108.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.108.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.108.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.108.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.108.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.108.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.109.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.109.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.109.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.109.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.109.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.109.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.110.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.110.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.110.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.110.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.110.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.110.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.111.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.111.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.111.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.111.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.111.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.111.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.112.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.112.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.112.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.112.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.112.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.112.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.113.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.113.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.113.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.113.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.113.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.113.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.114.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.114.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.114.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.114.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.114.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.114.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.115.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.115.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.115.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.115.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.115.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.115.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.116.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.116.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.116.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.116.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.116.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.116.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.117.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.117.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.117.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.117.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.117.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.117.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.118.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.118.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.118.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.118.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.118.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.118.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.119.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.119.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.119.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.119.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.119.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.119.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.120.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.120.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.120.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.120.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.120.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.120.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.121.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.121.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.121.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.121.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.121.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.121.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.122.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.122.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.122.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.122.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.122.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.122.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.123.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.123.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.123.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.123.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.123.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.123.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.124.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.124.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.124.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.124.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.124.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.124.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.125.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.125.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.125.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.125.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.125.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.125.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.126.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.126.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.126.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.126.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.126.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.126.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.127.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.127.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.127.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.127.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.127.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.127.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.128.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.128.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.128.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.128.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.128.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.128.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.129.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.129.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.129.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.129.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.129.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.129.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.130.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.130.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.130.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.130.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.130.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.130.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.131.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.131.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.131.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.131.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.131.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.131.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.132.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.132.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.132.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.132.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.132.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.132.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.133.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.133.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.133.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.133.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.133.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.133.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.134.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.134.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.134.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.134.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.134.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.134.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.135.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.135.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.135.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.135.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.135.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.135.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.136.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.136.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.136.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.136.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.136.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.136.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.137.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.137.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.137.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.137.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.137.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.137.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.138.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.138.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.138.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.138.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.138.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.138.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.139.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.139.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.139.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.139.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.139.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.139.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.140.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.140.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.140.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.140.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.140.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.140.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.141.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.141.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.141.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.141.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.141.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.141.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.142.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.142.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.142.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.142.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.142.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.142.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.143.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.143.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.143.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.143.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.143.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.143.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.144.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.144.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.144.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.144.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.144.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.144.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.145.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.145.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.145.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.145.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.145.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.145.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.146.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.146.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.146.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.146.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.146.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.146.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.147.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.147.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.147.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.147.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.147.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.147.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.148.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.148.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.148.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.148.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.148.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.148.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.149.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.149.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.149.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.149.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.149.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.149.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.150.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.150.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.150.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.150.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.150.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.150.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.151.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.151.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.151.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.151.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.151.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.151.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.152.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.152.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.152.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.152.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.152.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.152.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.153.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.153.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.153.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.153.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.153.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.153.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.154.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.154.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.154.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.154.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.154.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.154.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.155.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.155.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.155.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.155.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.155.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.155.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.156.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.156.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.156.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.156.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.156.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.156.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.157.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.157.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.157.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.157.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.157.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.157.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.158.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.158.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.158.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.158.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.158.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.158.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.159.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.159.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.159.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.159.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.159.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.159.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.160.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.160.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.160.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.160.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.160.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.160.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.161.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.161.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.161.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.161.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.161.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.161.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.162.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.162.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.162.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.162.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.162.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.162.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.163.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.163.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.163.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.163.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.163.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.163.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.164.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.164.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.164.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.164.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.164.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.164.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.165.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.165.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.165.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.165.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.165.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.165.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.166.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.166.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.166.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.166.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.166.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.166.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.167.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.167.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.167.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.167.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.167.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.167.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.168.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.168.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.168.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.168.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.168.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.168.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.169.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.169.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.169.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.169.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.169.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.169.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.170.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.170.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.170.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.170.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.170.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.170.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.171.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.171.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.171.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.171.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.171.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.171.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.172.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.172.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.172.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.172.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.172.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.172.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.173.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.173.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.173.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.173.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.173.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.173.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.174.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.174.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.174.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.174.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.174.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.174.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.175.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.175.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.175.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.175.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.175.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.175.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.176.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.176.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.176.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.176.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.176.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.176.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.177.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.177.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.177.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.177.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.177.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.177.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.178.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.178.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.178.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.178.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.178.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.178.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.179.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.179.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.179.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.179.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.179.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.179.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.180.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.180.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.180.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.180.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.180.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.180.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.181.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.181.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.181.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.181.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.181.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.181.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.182.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.182.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.182.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.182.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.182.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.182.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.183.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.183.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.183.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.183.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.183.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.183.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.184.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.184.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.184.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.184.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.184.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.184.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.185.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.185.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.185.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.185.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.185.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.185.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.186.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.186.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.186.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.186.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.186.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.186.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.187.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.187.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.187.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.187.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.187.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.187.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.188.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.188.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.188.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.188.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.188.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.188.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.189.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.189.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.189.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.189.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.189.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.189.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.190.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.190.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.190.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.190.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.190.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.190.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.191.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.191.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.191.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.191.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.191.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.191.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.192.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.192.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.192.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.192.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.192.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.192.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.193.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.193.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.193.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.193.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.193.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.193.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.194.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.194.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.194.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.194.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.194.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.194.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.195.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.195.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.195.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.195.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.195.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.195.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.196.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.196.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.196.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.196.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.196.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.196.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.197.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.197.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.197.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.197.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.197.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.197.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.198.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.198.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.198.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.198.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.198.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.198.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.199.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.199.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.199.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.199.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.199.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.199.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.200.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.200.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.200.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.200.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.200.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.200.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.201.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.201.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.201.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.201.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.201.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.201.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.202.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.202.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.202.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.202.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.202.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.202.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.203.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.203.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.203.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.203.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.203.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.203.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.204.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.204.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.204.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.204.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.204.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.204.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.205.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.205.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.205.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.205.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.205.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.205.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.206.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.206.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.206.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.206.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.206.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.206.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.207.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.207.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.207.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.207.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.207.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.207.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.208.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.208.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.208.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.208.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.208.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.208.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.209.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.209.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.209.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.209.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.209.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.209.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.210.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.210.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.210.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.210.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.210.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.210.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.211.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.211.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.211.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.211.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.211.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.211.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.212.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.212.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.212.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.212.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.212.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.212.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.213.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.213.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.213.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.213.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.213.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.213.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.214.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.214.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.214.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.214.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.214.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.214.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.215.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.215.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.215.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.215.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.215.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.215.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.216.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.216.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.216.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.216.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.216.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.216.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.217.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.217.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.217.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.217.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.217.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.217.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.218.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.218.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.218.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.218.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.218.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.218.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.219.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.219.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.219.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.219.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.219.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.219.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.220.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.220.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.220.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.220.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.220.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.220.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.221.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.221.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.221.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.221.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.221.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.221.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.222.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.222.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.222.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.222.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.222.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.222.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.223.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.223.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.223.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.223.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.223.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.223.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.224.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.224.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.224.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.224.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.224.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.224.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.225.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.225.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.225.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.225.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.225.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.225.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.226.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.226.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.226.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.226.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.226.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.226.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.227.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.227.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.227.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.227.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.227.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.227.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.228.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.228.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.228.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.228.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.228.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.228.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.229.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.229.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.229.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.229.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.229.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.229.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.230.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.230.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.230.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.230.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.230.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.230.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.231.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.231.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.231.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.231.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.231.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.231.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.232.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.232.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.232.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.232.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.232.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.232.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.233.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.233.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.233.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.233.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.233.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.233.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.234.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.234.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.234.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.234.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.234.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.234.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.235.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.235.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.235.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.235.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.235.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.235.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.236.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.236.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.236.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.236.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.236.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.236.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.237.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.237.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.237.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.237.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.237.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.237.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.238.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.238.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.238.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.238.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.238.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.238.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.239.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.239.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.239.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.239.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.239.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.239.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.240.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.240.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.240.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.240.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.240.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.240.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.241.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.241.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.241.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.241.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.241.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.241.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.242.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.242.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.242.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.242.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.242.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.242.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.243.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.243.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.243.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.243.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.243.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.243.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.244.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.244.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.244.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.244.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.244.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.244.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.245.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.245.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.245.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.245.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.245.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.245.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.246.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.246.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.246.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.246.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.246.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.246.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.247.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.247.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.247.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.247.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.247.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.247.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.248.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.248.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.248.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.248.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.248.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.248.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.249.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.249.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.249.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.249.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.249.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.249.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.250.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.250.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.250.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.250.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.250.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.250.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.251.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.251.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.251.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.251.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.251.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.251.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.252.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.252.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.252.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.252.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.252.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.252.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.253.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.253.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.253.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.253.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.253.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.253.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.254.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.254.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.254.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.254.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.254.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.254.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.255.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.255.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.255.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.255.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.255.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.255.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.input_layernorm.weight": "model-00133-of-000163.safetensors", "model.layers.50.post_attention_layernorm.weight": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.q_a_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.self_attn.q_a_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.q_a_layernorm.weight": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.q_b_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.self_attn.q_b_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.kv_a_proj_with_mqa.weight": "model-00133-of-000163.safetensors", - "model.layers.51.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.kv_a_layernorm.weight": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.kv_b_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.self_attn.kv_b_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.o_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.self_attn.o_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.gate.weight": "model-00133-of-000163.safetensors", "model.layers.51.mlp.gate.e_score_correction_bias": "model-00133-of-000163.safetensors", "model.layers.51.mlp.shared_experts.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.shared_experts.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.shared_experts.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.shared_experts.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.shared_experts.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.0.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.0.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.0.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.0.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.0.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.0.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.1.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.1.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.1.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.1.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.1.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.2.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.2.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.2.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.2.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.2.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.3.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.3.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.3.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.3.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.3.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.4.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.4.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.4.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.4.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.4.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.5.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.5.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.5.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.5.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.5.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.6.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.6.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.6.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.6.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.6.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.6.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.7.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.7.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.7.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.7.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.7.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.8.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.8.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.8.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.8.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.8.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.8.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.9.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.9.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.9.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.9.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.9.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.9.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.10.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.10.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.10.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.10.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.10.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.10.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.11.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.11.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.11.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.11.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.11.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.11.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.12.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.12.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.12.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.12.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.12.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.12.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.13.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.13.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.13.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.13.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.13.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.13.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.14.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.14.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.14.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.14.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.14.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.14.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.15.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.15.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.15.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.15.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.15.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.15.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.16.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.16.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.16.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.16.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.16.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.16.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.17.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.17.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.17.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.17.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.17.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.17.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.18.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.18.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.18.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.18.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.18.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.18.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.19.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.19.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.19.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.19.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.19.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.19.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.20.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.20.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.20.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.20.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.20.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.20.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.21.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.21.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.21.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.21.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.21.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.21.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.22.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.22.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.22.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.22.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.22.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.22.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.23.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.23.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.23.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.23.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.23.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.23.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.24.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.24.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.24.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.24.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.24.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.24.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.25.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.25.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.25.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.25.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.25.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.25.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.26.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.26.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.26.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.26.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.26.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.26.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.27.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.27.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.27.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.27.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.27.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.27.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.28.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.28.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.28.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.28.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.28.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.28.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.29.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.29.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.29.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.29.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.29.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.29.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.30.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.30.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.30.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.30.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.30.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.30.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.31.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.31.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.31.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.31.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.31.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.31.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.32.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.32.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.32.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.32.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.32.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.32.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.33.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.33.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.33.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.33.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.33.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.33.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.34.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.34.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.34.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.34.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.34.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.34.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.35.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.35.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.35.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.35.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.35.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.35.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.36.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.36.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.36.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.36.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.36.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.36.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.37.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.37.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.37.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.37.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.37.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.37.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.38.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.38.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.38.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.38.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.38.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.38.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.39.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.39.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.39.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.39.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.39.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.39.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.40.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.40.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.40.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.40.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.40.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.40.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.41.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.41.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.41.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.41.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.41.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.41.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.42.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.42.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.42.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.42.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.42.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.42.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.43.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.43.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.43.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.43.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.43.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.43.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.44.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.44.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.44.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.44.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.44.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.44.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.45.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.45.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.45.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.45.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.45.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.45.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.46.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.46.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.46.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.46.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.46.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.46.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.47.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.47.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.47.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.47.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.47.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.47.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.48.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.48.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.48.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.48.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.48.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.48.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.49.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.49.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.49.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.49.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.49.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.49.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.50.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.50.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.50.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.50.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.50.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.50.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.51.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.51.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.51.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.51.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.51.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.51.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.52.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.52.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.52.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.52.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.52.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.52.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.53.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.53.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.53.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.53.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.53.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.53.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.54.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.54.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.54.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.54.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.54.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.54.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.55.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.55.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.55.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.55.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.55.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.55.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.56.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.56.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.56.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.56.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.56.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.56.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.57.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.57.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.57.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.57.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.57.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.57.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.58.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.58.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.58.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.58.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.58.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.58.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.59.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.59.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.59.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.59.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.59.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.59.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.60.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.60.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.60.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.60.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.60.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.60.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.61.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.61.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.61.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.61.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.61.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.61.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.62.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.62.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.62.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.62.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.62.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.62.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.63.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.63.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.63.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.63.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.63.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.63.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.64.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.64.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.64.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.64.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.64.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.64.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.65.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.65.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.65.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.65.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.65.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.65.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.66.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.66.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.66.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.66.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.66.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.66.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.67.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.67.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.67.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.67.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.67.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.67.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.68.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.68.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.68.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.68.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.68.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.68.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.69.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.69.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.69.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.69.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.69.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.69.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.70.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.70.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.70.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.70.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.70.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.70.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.71.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.71.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.71.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.71.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.71.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.71.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.72.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.72.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.72.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.72.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.72.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.72.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.73.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.73.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.73.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.73.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.73.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.73.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.74.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.74.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.74.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.74.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.74.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.74.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.75.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.75.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.75.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.75.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.75.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.75.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.76.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.76.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.76.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.76.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.76.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.76.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.77.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.77.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.77.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.77.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.77.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.77.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.78.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.78.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.78.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.78.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.78.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.78.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.79.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.79.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.79.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.79.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.79.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.79.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.80.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.80.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.80.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.80.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.80.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.80.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.81.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.81.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.81.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.81.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.81.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.81.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.82.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.82.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.82.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.82.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.82.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.82.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.83.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.83.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.83.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.83.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.83.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.83.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.84.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.84.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.84.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.84.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.84.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.84.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.85.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.85.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.85.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.85.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.85.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.85.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.86.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.86.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.86.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.86.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.86.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.86.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.87.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.87.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.87.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.87.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.87.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.87.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.88.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.88.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.88.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.88.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.88.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.88.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.89.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.89.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.89.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.89.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.89.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.89.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.90.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.90.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.90.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.90.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.90.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.90.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.91.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.91.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.91.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.91.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.91.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.91.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.92.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.92.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.92.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.92.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.92.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.92.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.93.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.93.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.93.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.93.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.93.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.93.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.94.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.94.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.94.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.94.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.94.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.94.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.95.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.95.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.95.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.95.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.95.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.95.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.96.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.96.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.96.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.96.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.96.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.96.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.97.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.97.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.97.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.97.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.97.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.97.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.98.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.98.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.98.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.98.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.98.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.98.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.99.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.99.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.99.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.99.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.99.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.99.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.100.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.100.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.100.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.100.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.100.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.100.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.101.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.101.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.101.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.101.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.101.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.101.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.102.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.102.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.102.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.102.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.102.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.102.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.103.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.103.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.103.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.103.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.103.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.103.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.104.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.104.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.104.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.104.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.104.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.104.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.105.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.105.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.105.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.105.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.105.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.105.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.106.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.106.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.106.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.106.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.106.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.106.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.107.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.107.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.107.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.107.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.107.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.107.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.108.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.108.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.108.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.108.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.108.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.108.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.109.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.109.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.109.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.109.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.109.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.109.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.110.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.110.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.110.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.110.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.110.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.110.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.111.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.111.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.111.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.111.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.111.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.111.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.112.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.112.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.112.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.112.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.112.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.112.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.113.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.113.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.113.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.113.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.113.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.113.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.114.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.114.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.114.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.114.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.114.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.114.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.115.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.115.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.115.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.115.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.115.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.115.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.116.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.116.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.116.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.116.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.116.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.116.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.117.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.117.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.117.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.117.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.117.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.117.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.118.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.118.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.118.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.118.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.118.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.118.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.119.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.119.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.119.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.119.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.119.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.119.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.120.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.120.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.120.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.120.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.120.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.120.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.121.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.121.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.121.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.121.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.121.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.121.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.122.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.122.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.122.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.122.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.122.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.122.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.123.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.123.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.123.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.123.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.123.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.123.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.124.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.124.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.124.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.124.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.124.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.124.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.125.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.125.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.125.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.125.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.125.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.125.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.126.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.126.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.126.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.126.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.126.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.126.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.127.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.127.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.127.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.127.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.127.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.127.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.128.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.128.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.128.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.128.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.128.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.128.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.129.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.129.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.129.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.129.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.129.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.129.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.130.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.130.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.130.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.130.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.130.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.130.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.131.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.131.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.131.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.131.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.131.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.131.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.132.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.132.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.132.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.132.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.132.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.132.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.133.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.133.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.133.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.133.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.133.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.133.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.134.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.134.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.134.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.134.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.134.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.134.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.135.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.135.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.135.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.135.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.135.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.135.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.136.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.136.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.136.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.136.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.136.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.136.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.137.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.137.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.137.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.137.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.137.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.137.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.138.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.138.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.138.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.138.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.138.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.138.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.139.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.139.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.139.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.139.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.139.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.139.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.140.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.140.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.140.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.140.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.140.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.140.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.141.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.141.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.141.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.141.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.141.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.141.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.142.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.142.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.142.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.142.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.142.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.142.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.143.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.143.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.143.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.143.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.143.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.143.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.144.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.144.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.144.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.144.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.144.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.144.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.145.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.145.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.145.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.145.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.145.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.145.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.146.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.146.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.146.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.146.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.146.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.146.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.147.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.147.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.147.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.147.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.147.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.147.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.148.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.148.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.148.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.148.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.148.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.148.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.149.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.149.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.149.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.149.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.149.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.149.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.150.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.150.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.150.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.150.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.150.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.150.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.151.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.151.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.151.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.151.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.151.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.151.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.152.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.152.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.152.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.152.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.152.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.152.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.153.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.153.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.153.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.153.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.153.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.153.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.154.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.154.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.154.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.154.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.154.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.154.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.155.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.155.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.155.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.155.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.155.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.155.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.156.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.156.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.156.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.156.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.156.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.156.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.157.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.157.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.157.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.157.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.157.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.157.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.158.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.158.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.158.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.158.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.158.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.158.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.159.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.159.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.159.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.159.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.159.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.159.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.160.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.160.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.160.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.160.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.160.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.160.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.161.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.161.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.161.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.161.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.161.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.161.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.162.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.162.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.162.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.162.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.162.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.162.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.163.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.163.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.163.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.163.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.163.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.163.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.164.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.164.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.164.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.164.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.164.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.164.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.165.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.165.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.165.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.165.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.165.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.165.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.166.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.166.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.166.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.166.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.166.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.166.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.167.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.167.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.167.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.167.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.167.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.167.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.168.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.168.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.168.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.168.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.168.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.168.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.169.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.169.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.169.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.169.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.169.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.169.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.170.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.170.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.170.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.170.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.170.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.170.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.171.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.171.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.171.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.171.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.171.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.171.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.172.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.172.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.172.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.172.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.172.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.172.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.173.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.173.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.173.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.173.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.173.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.173.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.174.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.174.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.174.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.174.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.174.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.174.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.175.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.175.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.175.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.175.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.175.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.175.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.176.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.176.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.176.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.176.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.176.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.176.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.177.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.177.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.177.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.177.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.177.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.177.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.178.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.178.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.178.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.178.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.178.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.178.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.179.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.179.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.179.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.179.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.179.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.179.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.180.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.180.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.180.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.180.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.180.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.180.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.181.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.181.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.181.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.181.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.181.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.181.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.182.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.182.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.182.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.182.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.182.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.182.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.183.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.183.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.183.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.183.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.183.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.183.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.184.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.184.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.184.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.184.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.184.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.184.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.185.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.185.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.185.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.185.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.185.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.185.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.186.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.186.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.186.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.186.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.186.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.186.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.187.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.187.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.187.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.187.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.187.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.187.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.188.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.188.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.188.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.188.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.188.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.188.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.189.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.189.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.189.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.189.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.189.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.189.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.190.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.190.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.190.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.190.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.190.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.190.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.191.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.191.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.191.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.191.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.191.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.191.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.192.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.192.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.192.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.192.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.192.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.192.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.193.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.193.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.193.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.193.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.193.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.193.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.194.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.194.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.194.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.194.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.194.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.194.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.195.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.195.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.195.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.195.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.195.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.195.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.196.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.196.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.196.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.196.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.196.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.196.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.197.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.197.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.197.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.197.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.197.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.197.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.198.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.198.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.198.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.198.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.198.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.198.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.199.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.199.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.199.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.199.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.199.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.199.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.200.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.200.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.200.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.200.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.200.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.200.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.201.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.201.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.201.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.201.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.201.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.201.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.202.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.202.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.202.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.202.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.202.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.202.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.203.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.203.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.203.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.203.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.203.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.203.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.204.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.204.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.204.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.204.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.204.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.204.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.205.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.205.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.205.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.205.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.205.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.205.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.206.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.206.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.206.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.206.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.206.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.206.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.207.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.207.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.207.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.207.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.207.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.207.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.208.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.208.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.208.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.208.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.208.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.208.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.209.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.209.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.209.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.209.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.209.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.209.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.210.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.210.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.210.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.210.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.210.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.210.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.211.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.211.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.211.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.211.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.211.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.211.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.212.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.212.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.212.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.212.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.212.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.212.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.213.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.213.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.213.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.213.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.213.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.213.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.214.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.214.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.214.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.214.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.214.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.214.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.215.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.215.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.215.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.215.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.215.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.215.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.216.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.216.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.216.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.216.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.216.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.216.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.217.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.217.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.217.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.217.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.217.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.217.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.218.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.218.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.218.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.218.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.218.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.218.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.219.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.219.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.219.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.219.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.219.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.219.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.220.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.220.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.220.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.220.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.220.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.220.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.221.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.221.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.221.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.221.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.221.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.221.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.222.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.222.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.222.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.222.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.222.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.222.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.223.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.223.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.223.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.223.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.223.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.223.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.224.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.224.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.224.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.224.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.224.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.224.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.225.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.225.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.225.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.225.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.225.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.225.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.226.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.226.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.226.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.226.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.226.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.226.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.227.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.227.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.227.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.227.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.227.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.227.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.228.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.228.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.228.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.228.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.228.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.228.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.229.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.229.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.229.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.229.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.229.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.229.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.230.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.230.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.230.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.230.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.230.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.230.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.231.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.231.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.231.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.231.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.231.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.231.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.232.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.232.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.232.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.232.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.232.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.232.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.233.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.233.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.233.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.233.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.233.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.233.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.234.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.234.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.234.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.234.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.234.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.234.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.235.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.235.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.235.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.235.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.235.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.235.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.236.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.236.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.236.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.236.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.236.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.236.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.237.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.237.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.237.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.237.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.237.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.237.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.238.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.238.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.238.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.238.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.238.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.238.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.239.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.239.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.239.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.239.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.239.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.239.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.240.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.240.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.240.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.240.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.240.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.240.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.241.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.241.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.241.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.241.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.241.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.241.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.242.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.242.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.242.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.242.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.242.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.242.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.243.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.243.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.243.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.243.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.243.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.243.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.244.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.244.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.244.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.244.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.244.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.244.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.245.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.245.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.245.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.245.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.245.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.245.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.246.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.246.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.246.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.246.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.246.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.246.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.247.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.247.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.247.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.247.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.247.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.247.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.248.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.248.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.248.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.248.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.248.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.248.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.249.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.249.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.249.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.249.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.249.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.249.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.250.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.250.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.250.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.250.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.250.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.250.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.251.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.251.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.251.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.251.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.251.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.251.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.252.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.252.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.252.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.252.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.252.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.252.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.253.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.253.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.253.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.253.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.253.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.253.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.254.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.254.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.254.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.254.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.254.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.254.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.255.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.255.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.255.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.255.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.255.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.255.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.input_layernorm.weight": "model-00136-of-000163.safetensors", "model.layers.51.post_attention_layernorm.weight": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.q_a_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.self_attn.q_a_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.q_a_layernorm.weight": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.q_b_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.self_attn.q_b_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.kv_a_proj_with_mqa.weight": "model-00136-of-000163.safetensors", - "model.layers.52.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.kv_a_layernorm.weight": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.kv_b_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.self_attn.kv_b_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.o_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.self_attn.o_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.gate.weight": "model-00136-of-000163.safetensors", "model.layers.52.mlp.gate.e_score_correction_bias": "model-00136-of-000163.safetensors", "model.layers.52.mlp.shared_experts.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.shared_experts.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.shared_experts.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.shared_experts.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.shared_experts.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.0.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.0.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.0.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.0.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.0.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.0.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.1.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.1.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.1.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.1.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.1.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.1.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.2.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.2.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.2.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.2.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.2.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.2.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.3.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.3.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.3.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.3.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.3.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.3.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.4.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.4.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.4.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.4.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.4.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.4.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.5.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.5.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.5.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.5.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.5.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.5.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.6.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.6.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.6.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.6.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.6.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.6.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.7.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.7.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.7.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.7.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.7.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.7.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.8.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.8.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.8.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.8.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.8.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.8.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.9.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.9.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.9.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.9.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.9.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.9.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.10.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.10.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.10.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.10.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.10.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.10.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.11.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.11.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.11.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.11.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.11.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.11.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.12.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.12.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.12.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.12.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.12.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.12.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.13.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.13.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.13.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.13.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.13.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.13.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.14.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.14.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.14.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.14.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.14.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.14.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.15.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.15.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.15.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.15.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.15.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.15.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.16.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.16.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.16.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.16.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.16.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.16.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.17.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.17.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.17.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.17.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.17.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.17.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.18.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.18.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.18.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.18.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.18.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.18.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.19.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.19.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.19.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.19.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.19.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.19.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.20.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.20.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.20.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.20.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.20.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.20.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.21.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.21.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.21.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.21.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.21.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.21.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.22.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.22.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.22.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.22.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.22.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.22.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.23.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.23.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.23.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.23.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.23.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.23.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.24.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.24.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.24.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.24.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.24.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.24.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.25.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.25.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.25.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.25.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.25.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.25.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.26.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.26.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.26.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.26.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.26.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.26.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.27.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.27.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.27.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.27.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.27.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.27.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.28.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.28.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.28.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.28.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.28.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.28.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.29.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.29.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.29.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.29.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.29.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.29.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.30.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.30.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.30.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.30.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.30.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.30.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.31.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.31.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.31.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.31.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.31.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.31.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.32.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.32.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.32.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.32.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.32.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.32.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.33.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.33.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.33.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.33.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.33.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.33.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.34.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.34.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.34.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.34.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.34.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.34.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.35.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.35.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.35.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.35.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.35.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.35.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.36.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.36.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.36.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.36.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.36.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.36.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.37.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.37.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.37.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.37.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.37.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.37.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.38.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.38.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.38.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.38.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.38.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.38.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.39.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.39.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.39.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.39.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.39.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.39.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.40.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.40.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.40.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.40.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.40.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.40.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.41.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.41.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.41.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.41.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.41.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.41.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.42.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.42.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.42.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.42.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.42.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.42.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.43.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.43.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.43.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.43.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.43.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.43.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.44.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.44.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.44.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.44.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.44.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.44.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.45.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.45.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.45.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.45.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.45.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.45.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.46.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.46.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.46.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.46.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.46.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.46.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.47.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.47.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.47.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.47.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.47.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.47.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.48.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.48.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.48.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.48.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.48.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.48.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.49.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.49.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.49.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.49.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.49.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.49.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.50.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.50.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.50.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.50.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.50.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.50.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.51.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.51.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.51.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.51.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.51.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.51.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.52.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.52.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.52.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.52.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.52.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.52.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.53.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.53.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.53.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.53.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.53.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.53.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.54.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.54.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.54.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.54.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.54.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.54.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.55.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.55.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.55.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.55.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.55.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.55.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.56.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.56.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.56.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.56.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.56.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.56.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.57.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.57.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.57.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.57.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.57.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.57.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.58.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.58.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.58.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.58.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.58.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.58.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.59.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.59.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.59.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.59.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.59.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.59.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.60.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.60.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.60.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.60.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.60.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.60.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.61.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.61.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.61.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.61.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.61.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.61.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.62.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.62.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.62.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.62.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.62.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.62.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.63.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.63.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.63.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.63.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.63.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.63.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.64.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.64.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.64.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.64.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.64.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.64.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.65.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.65.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.65.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.65.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.65.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.65.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.66.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.66.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.66.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.66.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.66.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.66.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.67.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.67.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.67.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.67.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.67.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.67.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.68.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.68.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.68.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.68.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.68.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.68.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.69.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.69.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.69.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.69.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.69.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.69.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.70.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.70.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.70.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.70.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.70.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.70.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.71.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.71.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.71.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.71.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.71.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.71.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.72.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.72.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.72.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.72.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.72.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.72.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.73.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.73.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.73.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.73.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.73.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.73.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.74.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.74.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.74.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.74.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.74.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.74.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.75.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.75.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.75.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.75.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.75.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.75.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.76.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.76.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.76.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.76.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.76.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.76.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.77.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.77.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.77.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.77.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.77.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.77.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.78.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.78.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.78.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.78.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.78.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.78.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.79.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.79.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.79.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.79.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.79.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.79.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.80.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.80.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.80.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.80.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.80.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.80.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.81.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.81.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.81.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.81.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.81.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.81.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.82.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.82.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.82.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.82.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.82.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.82.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.83.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.83.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.83.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.83.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.83.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.83.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.84.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.84.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.84.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.84.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.84.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.84.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.85.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.85.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.85.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.85.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.85.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.85.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.86.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.86.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.86.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.86.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.86.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.86.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.87.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.87.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.87.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.87.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.87.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.87.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.88.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.88.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.88.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.88.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.88.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.88.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.89.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.89.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.89.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.89.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.89.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.89.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.90.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.90.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.90.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.90.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.90.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.90.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.91.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.91.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.91.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.91.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.91.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.91.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.92.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.92.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.92.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.92.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.92.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.92.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.93.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.93.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.93.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.93.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.93.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.93.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.94.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.94.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.94.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.94.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.94.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.94.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.95.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.95.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.95.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.95.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.95.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.95.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.96.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.96.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.96.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.96.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.96.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.96.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.97.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.97.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.97.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.97.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.97.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.97.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.98.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.98.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.98.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.98.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.98.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.98.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.99.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.99.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.99.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.99.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.99.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.99.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.100.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.100.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.100.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.100.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.100.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.100.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.101.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.101.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.101.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.101.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.101.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.101.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.102.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.102.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.102.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.102.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.102.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.102.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.103.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.103.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.103.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.103.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.103.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.103.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.104.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.104.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.104.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.104.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.104.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.104.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.105.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.105.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.105.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.105.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.105.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.105.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.106.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.106.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.106.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.106.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.106.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.106.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.107.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.107.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.107.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.107.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.107.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.107.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.108.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.108.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.108.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.108.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.108.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.108.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.109.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.109.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.109.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.109.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.109.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.109.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.110.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.110.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.110.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.110.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.110.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.110.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.111.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.111.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.111.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.111.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.111.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.111.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.112.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.112.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.112.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.112.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.112.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.112.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.113.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.113.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.113.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.113.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.113.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.113.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.114.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.114.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.114.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.114.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.114.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.114.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.115.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.115.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.115.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.115.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.115.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.115.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.116.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.116.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.116.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.116.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.116.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.116.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.117.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.117.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.117.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.117.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.117.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.117.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.118.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.118.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.118.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.118.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.118.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.118.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.119.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.119.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.119.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.119.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.119.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.119.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.120.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.120.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.120.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.120.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.120.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.120.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.121.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.121.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.121.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.121.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.121.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.121.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.122.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.122.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.122.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.122.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.122.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.122.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.123.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.123.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.123.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.123.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.123.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.123.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.124.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.124.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.124.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.124.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.124.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.124.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.125.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.125.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.125.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.125.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.125.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.125.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.126.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.126.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.126.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.126.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.126.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.126.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.127.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.127.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.127.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.127.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.127.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.127.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.128.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.128.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.128.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.128.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.128.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.128.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.129.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.129.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.129.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.129.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.129.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.129.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.130.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.130.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.130.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.130.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.130.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.130.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.131.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.131.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.131.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.131.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.131.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.131.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.132.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.132.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.132.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.132.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.132.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.132.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.133.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.133.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.133.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.133.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.133.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.133.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.134.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.134.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.134.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.134.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.134.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.134.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.135.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.135.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.135.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.135.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.135.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.135.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.136.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.136.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.136.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.136.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.136.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.136.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.137.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.137.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.137.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.137.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.137.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.137.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.138.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.138.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.138.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.138.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.138.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.138.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.139.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.139.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.139.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.139.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.139.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.139.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.140.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.140.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.140.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.140.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.140.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.140.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.141.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.141.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.141.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.141.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.141.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.141.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.142.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.142.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.142.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.142.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.142.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.142.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.143.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.143.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.143.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.143.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.143.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.143.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.144.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.144.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.144.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.144.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.144.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.144.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.145.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.145.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.145.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.145.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.145.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.145.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.146.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.146.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.146.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.146.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.146.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.146.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.147.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.147.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.147.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.147.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.147.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.147.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.148.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.148.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.148.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.148.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.148.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.148.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.149.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.149.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.149.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.149.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.149.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.149.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.150.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.150.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.150.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.150.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.150.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.150.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.151.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.151.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.151.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.151.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.151.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.151.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.152.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.152.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.152.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.152.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.152.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.152.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.153.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.153.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.153.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.153.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.153.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.153.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.154.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.154.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.154.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.154.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.154.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.154.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.155.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.155.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.155.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.155.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.155.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.155.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.156.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.156.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.156.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.156.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.156.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.156.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.157.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.157.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.157.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.157.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.157.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.157.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.158.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.158.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.158.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.158.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.158.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.158.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.159.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.159.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.159.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.159.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.159.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.159.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.160.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.160.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.160.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.160.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.160.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.160.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.161.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.161.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.161.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.161.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.161.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.161.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.162.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.162.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.162.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.162.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.162.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.162.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.163.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.163.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.163.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.163.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.163.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.163.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.164.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.164.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.164.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.164.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.164.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.164.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.165.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.165.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.165.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.165.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.165.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.165.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.166.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.166.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.166.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.166.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.166.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.166.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.167.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.167.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.167.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.167.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.167.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.167.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.168.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.168.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.168.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.168.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.168.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.168.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.169.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.169.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.169.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.169.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.169.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.169.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.170.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.170.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.170.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.170.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.170.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.170.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.171.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.171.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.171.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.171.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.171.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.171.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.172.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.172.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.172.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.172.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.172.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.172.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.173.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.173.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.173.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.173.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.173.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.173.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.174.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.174.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.174.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.174.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.174.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.174.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.175.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.175.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.175.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.175.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.175.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.175.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.176.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.176.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.176.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.176.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.176.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.176.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.177.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.177.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.177.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.177.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.177.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.177.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.178.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.178.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.178.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.178.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.178.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.178.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.179.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.179.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.179.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.179.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.179.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.179.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.180.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.180.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.180.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.180.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.180.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.180.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.181.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.181.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.181.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.181.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.181.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.181.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.182.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.182.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.182.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.182.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.182.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.182.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.183.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.183.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.183.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.183.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.183.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.183.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.184.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.184.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.184.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.184.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.184.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.184.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.185.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.185.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.185.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.185.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.185.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.185.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.186.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.186.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.186.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.186.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.186.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.186.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.187.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.187.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.187.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.187.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.187.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.187.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.188.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.188.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.188.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.188.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.188.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.188.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.189.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.189.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.189.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.189.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.189.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.189.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.190.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.190.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.190.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.190.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.190.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.190.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.191.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.191.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.191.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.191.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.191.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.191.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.192.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.192.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.192.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.192.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.192.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.192.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.193.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.193.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.193.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.193.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.193.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.193.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.194.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.194.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.194.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.194.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.194.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.194.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.195.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.195.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.195.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.195.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.195.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.195.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.196.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.196.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.196.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.196.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.196.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.196.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.197.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.197.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.197.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.197.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.197.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.197.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.198.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.198.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.198.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.198.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.198.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.198.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.199.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.199.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.199.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.199.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.199.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.199.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.200.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.200.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.200.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.200.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.200.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.200.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.201.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.201.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.201.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.201.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.201.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.201.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.202.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.202.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.202.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.202.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.202.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.202.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.203.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.203.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.203.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.203.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.203.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.203.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.204.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.204.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.204.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.204.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.204.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.204.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.205.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.205.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.205.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.205.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.205.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.205.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.206.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.206.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.206.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.206.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.206.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.206.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.207.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.207.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.207.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.207.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.207.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.207.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.208.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.208.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.208.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.208.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.208.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.208.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.209.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.209.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.209.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.209.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.209.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.209.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.210.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.210.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.210.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.210.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.210.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.210.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.211.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.211.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.211.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.211.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.211.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.211.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.212.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.212.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.212.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.212.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.212.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.212.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.213.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.213.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.213.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.213.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.213.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.213.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.214.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.214.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.214.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.214.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.214.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.214.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.215.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.215.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.215.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.215.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.215.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.215.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.216.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.216.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.216.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.216.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.216.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.216.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.217.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.217.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.217.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.217.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.217.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.217.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.218.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.218.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.218.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.218.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.218.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.218.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.219.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.219.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.219.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.219.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.219.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.219.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.220.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.220.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.220.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.220.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.220.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.220.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.221.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.221.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.221.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.221.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.221.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.221.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.222.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.222.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.222.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.222.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.222.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.222.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.223.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.223.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.223.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.223.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.223.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.223.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.224.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.224.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.224.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.224.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.224.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.224.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.225.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.225.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.225.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.225.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.225.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.225.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.226.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.226.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.226.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.226.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.226.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.226.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.227.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.227.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.227.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.227.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.227.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.227.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.228.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.228.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.228.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.228.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.228.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.228.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.229.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.229.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.229.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.229.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.229.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.229.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.230.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.230.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.230.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.230.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.230.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.230.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.231.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.231.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.231.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.231.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.231.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.231.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.232.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.232.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.232.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.232.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.232.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.232.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.233.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.233.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.233.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.233.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.233.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.233.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.234.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.234.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.234.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.234.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.234.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.234.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.235.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.235.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.235.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.235.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.235.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.235.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.236.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.236.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.236.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.236.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.236.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.236.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.237.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.237.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.237.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.237.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.237.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.237.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.238.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.238.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.238.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.238.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.238.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.238.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.239.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.239.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.239.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.239.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.239.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.239.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.240.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.240.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.240.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.240.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.240.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.240.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.241.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.241.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.241.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.241.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.241.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.241.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.242.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.242.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.242.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.242.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.242.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.242.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.243.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.243.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.243.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.243.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.243.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.243.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.244.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.244.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.244.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.244.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.244.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.244.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.245.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.245.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.245.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.245.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.245.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.245.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.246.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.246.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.246.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.246.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.246.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.246.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.247.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.247.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.247.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.247.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.247.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.247.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.248.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.248.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.248.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.248.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.248.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.248.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.249.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.249.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.249.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.249.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.249.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.249.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.250.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.250.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.250.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.250.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.250.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.250.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.251.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.251.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.251.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.251.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.251.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.251.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.252.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.252.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.252.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.252.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.252.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.252.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.253.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.253.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.253.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.253.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.253.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.253.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.254.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.254.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.254.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.254.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.254.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.254.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.255.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.255.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.255.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.255.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.255.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.255.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.input_layernorm.weight": "model-00139-of-000163.safetensors", "model.layers.52.post_attention_layernorm.weight": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.q_a_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.self_attn.q_a_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.q_a_layernorm.weight": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.q_b_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.self_attn.q_b_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.kv_a_proj_with_mqa.weight": "model-00139-of-000163.safetensors", - "model.layers.53.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.kv_a_layernorm.weight": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.kv_b_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.self_attn.kv_b_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.o_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.self_attn.o_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.gate.weight": "model-00139-of-000163.safetensors", "model.layers.53.mlp.gate.e_score_correction_bias": "model-00139-of-000163.safetensors", "model.layers.53.mlp.shared_experts.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.shared_experts.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.shared_experts.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.shared_experts.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.shared_experts.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.0.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.0.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.0.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.0.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.0.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.1.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.1.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.1.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.1.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.1.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.2.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.2.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.2.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.2.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.2.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.3.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.3.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.3.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.3.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.3.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.4.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.4.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.4.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.4.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.4.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.5.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.5.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.5.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.5.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.5.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.6.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.6.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.6.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.6.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.6.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.7.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.7.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.7.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.7.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.7.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.8.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.8.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.8.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.8.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.8.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.8.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.9.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.9.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.9.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.9.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.9.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.9.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.10.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.10.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.10.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.10.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.10.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.10.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.11.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.11.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.11.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.11.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.11.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.11.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.12.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.12.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.12.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.12.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.12.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.12.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.13.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.13.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.13.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.13.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.13.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.13.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.14.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.14.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.14.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.14.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.14.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.14.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.15.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.15.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.15.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.15.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.15.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.15.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.16.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.16.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.16.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.16.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.16.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.16.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.17.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.17.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.17.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.17.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.17.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.17.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.18.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.18.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.18.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.18.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.18.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.18.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.19.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.19.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.19.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.19.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.19.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.19.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.20.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.20.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.20.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.20.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.20.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.20.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.21.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.21.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.21.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.21.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.21.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.21.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.22.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.22.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.22.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.22.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.22.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.22.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.23.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.23.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.23.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.23.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.23.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.23.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.24.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.24.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.24.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.24.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.24.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.24.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.25.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.25.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.25.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.25.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.25.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.25.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.26.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.26.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.26.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.26.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.26.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.26.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.27.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.27.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.27.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.27.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.27.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.27.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.28.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.28.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.28.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.28.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.28.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.28.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.29.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.29.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.29.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.29.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.29.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.29.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.30.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.30.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.30.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.30.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.30.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.30.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.31.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.31.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.31.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.31.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.31.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.31.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.32.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.32.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.32.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.32.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.32.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.32.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.33.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.33.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.33.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.33.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.33.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.33.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.34.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.34.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.34.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.34.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.34.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.34.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.35.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.35.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.35.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.35.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.35.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.35.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.36.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.36.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.36.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.36.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.36.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.36.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.37.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.37.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.37.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.37.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.37.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.37.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.38.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.38.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.38.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.38.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.38.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.38.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.39.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.39.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.39.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.39.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.39.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.39.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.40.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.40.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.40.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.40.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.40.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.40.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.41.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.41.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.41.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.41.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.41.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.41.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.42.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.42.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.42.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.42.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.42.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.42.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.43.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.43.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.43.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.43.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.43.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.43.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.44.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.44.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.44.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.44.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.44.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.44.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.45.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.45.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.45.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.45.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.45.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.45.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.46.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.46.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.46.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.46.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.46.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.46.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.47.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.47.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.47.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.47.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.47.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.47.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.48.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.48.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.48.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.48.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.48.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.48.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.49.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.49.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.49.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.49.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.49.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.49.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.50.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.50.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.50.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.50.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.50.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.50.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.51.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.51.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.51.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.51.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.51.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.51.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.52.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.52.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.52.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.52.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.52.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.52.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.53.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.53.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.53.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.53.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.53.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.53.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.54.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.54.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.54.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.54.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.54.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.54.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.55.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.55.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.55.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.55.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.55.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.55.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.56.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.56.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.56.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.56.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.56.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.56.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.57.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.57.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.57.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.57.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.57.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.57.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.58.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.58.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.58.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.58.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.58.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.58.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.59.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.59.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.59.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.59.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.59.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.59.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.60.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.60.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.60.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.60.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.60.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.60.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.61.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.61.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.61.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.61.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.61.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.61.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.62.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.62.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.62.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.62.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.62.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.62.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.63.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.63.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.63.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.63.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.63.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.63.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.64.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.64.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.64.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.64.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.64.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.64.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.65.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.65.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.65.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.65.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.65.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.65.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.66.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.66.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.66.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.66.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.66.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.66.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.67.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.67.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.67.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.67.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.67.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.67.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.68.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.68.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.68.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.68.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.68.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.68.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.69.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.69.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.69.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.69.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.69.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.69.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.70.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.70.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.70.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.70.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.70.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.70.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.71.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.71.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.71.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.71.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.71.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.71.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.72.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.72.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.72.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.72.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.72.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.72.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.73.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.73.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.73.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.73.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.73.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.73.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.74.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.74.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.74.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.74.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.74.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.74.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.75.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.75.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.75.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.75.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.75.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.75.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.76.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.76.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.76.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.76.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.76.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.76.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.77.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.77.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.77.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.77.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.77.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.77.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.78.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.78.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.78.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.78.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.78.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.78.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.79.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.79.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.79.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.79.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.79.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.79.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.80.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.80.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.80.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.80.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.80.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.80.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.81.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.81.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.81.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.81.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.81.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.81.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.82.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.82.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.82.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.82.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.82.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.82.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.83.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.83.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.83.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.83.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.83.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.83.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.84.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.84.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.84.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.84.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.84.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.84.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.85.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.85.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.85.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.85.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.85.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.85.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.86.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.86.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.86.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.86.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.86.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.86.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.87.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.87.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.87.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.87.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.87.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.87.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.88.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.88.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.88.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.88.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.88.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.88.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.89.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.89.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.89.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.89.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.89.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.89.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.90.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.90.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.90.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.90.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.90.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.90.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.91.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.91.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.91.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.91.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.91.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.91.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.92.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.92.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.92.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.92.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.92.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.92.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.93.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.93.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.93.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.93.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.93.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.93.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.94.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.94.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.94.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.94.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.94.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.94.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.95.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.95.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.95.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.95.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.95.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.95.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.96.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.96.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.96.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.96.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.96.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.96.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.97.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.97.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.97.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.97.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.97.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.97.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.98.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.98.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.98.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.98.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.98.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.98.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.99.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.99.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.99.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.99.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.99.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.99.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.100.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.100.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.100.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.100.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.100.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.100.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.101.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.101.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.101.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.101.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.101.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.101.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.102.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.102.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.102.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.102.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.102.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.102.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.103.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.103.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.103.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.103.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.103.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.103.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.104.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.104.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.104.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.104.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.104.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.104.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.105.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.105.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.105.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.105.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.105.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.105.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.106.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.106.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.106.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.106.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.106.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.106.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.107.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.107.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.107.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.107.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.107.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.107.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.108.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.108.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.108.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.108.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.108.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.108.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.109.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.109.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.109.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.109.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.109.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.109.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.110.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.110.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.110.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.110.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.110.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.110.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.111.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.111.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.111.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.111.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.111.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.111.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.112.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.112.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.112.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.112.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.112.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.112.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.113.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.113.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.113.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.113.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.113.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.113.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.114.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.114.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.114.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.114.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.114.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.114.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.115.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.115.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.115.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.115.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.115.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.115.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.116.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.116.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.116.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.116.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.116.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.116.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.117.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.117.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.117.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.117.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.117.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.117.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.118.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.118.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.118.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.118.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.118.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.118.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.119.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.119.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.119.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.119.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.119.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.119.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.120.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.120.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.120.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.120.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.120.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.120.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.121.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.121.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.121.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.121.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.121.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.121.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.122.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.122.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.122.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.122.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.122.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.122.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.123.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.123.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.123.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.123.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.123.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.123.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.124.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.124.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.124.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.124.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.124.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.124.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.125.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.125.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.125.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.125.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.125.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.125.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.126.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.126.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.126.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.126.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.126.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.126.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.127.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.127.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.127.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.127.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.127.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.127.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.128.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.128.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.128.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.128.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.128.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.128.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.129.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.129.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.129.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.129.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.129.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.129.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.130.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.130.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.130.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.130.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.130.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.130.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.131.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.131.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.131.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.131.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.131.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.131.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.132.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.132.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.132.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.132.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.132.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.132.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.133.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.133.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.133.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.133.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.133.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.133.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.134.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.134.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.134.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.134.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.134.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.134.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.135.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.135.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.135.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.135.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.135.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.135.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.136.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.136.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.136.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.136.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.136.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.136.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.137.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.137.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.137.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.137.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.137.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.137.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.138.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.138.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.138.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.138.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.138.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.138.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.139.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.139.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.139.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.139.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.139.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.139.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.140.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.140.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.140.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.140.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.140.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.140.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.141.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.141.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.141.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.141.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.141.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.141.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.142.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.142.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.142.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.142.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.142.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.142.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.143.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.143.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.143.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.143.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.143.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.143.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.144.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.144.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.144.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.144.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.144.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.144.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.145.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.145.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.145.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.145.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.145.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.145.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.146.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.146.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.146.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.146.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.146.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.146.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.147.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.147.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.147.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.147.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.147.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.147.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.148.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.148.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.148.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.148.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.148.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.148.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.149.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.149.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.149.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.149.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.149.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.149.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.150.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.150.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.150.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.150.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.150.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.150.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.151.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.151.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.151.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.151.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.151.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.151.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.152.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.152.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.152.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.152.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.152.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.152.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.153.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.153.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.153.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.153.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.153.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.153.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.154.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.154.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.154.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.154.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.154.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.154.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.155.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.155.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.155.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.155.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.155.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.155.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.156.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.156.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.156.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.156.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.156.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.156.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.157.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.157.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.157.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.157.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.157.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.157.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.158.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.158.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.158.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.158.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.158.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.158.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.159.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.159.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.159.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.159.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.159.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.159.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.160.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.160.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.160.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.160.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.160.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.160.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.161.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.161.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.161.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.161.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.161.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.161.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.162.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.162.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.162.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.162.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.162.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.162.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.163.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.163.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.163.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.163.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.163.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.163.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.164.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.164.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.164.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.164.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.164.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.164.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.165.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.165.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.165.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.165.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.165.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.165.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.166.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.166.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.166.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.166.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.166.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.166.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.167.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.167.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.167.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.167.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.167.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.167.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.168.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.168.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.168.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.168.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.168.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.168.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.169.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.169.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.169.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.169.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.169.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.169.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.170.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.170.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.170.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.170.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.170.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.170.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.171.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.171.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.171.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.171.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.171.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.171.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.172.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.172.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.172.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.172.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.172.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.172.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.173.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.173.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.173.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.173.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.173.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.173.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.174.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.174.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.174.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.174.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.174.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.174.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.175.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.175.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.175.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.175.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.175.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.175.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.176.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.176.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.176.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.176.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.176.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.176.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.177.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.177.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.177.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.177.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.177.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.177.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.178.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.178.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.178.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.178.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.178.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.178.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.179.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.179.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.179.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.179.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.179.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.179.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.180.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.180.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.180.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.180.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.180.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.180.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.181.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.181.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.181.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.181.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.181.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.181.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.182.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.182.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.182.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.182.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.182.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.182.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.183.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.183.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.183.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.183.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.183.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.183.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.184.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.184.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.184.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.184.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.184.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.184.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.185.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.185.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.185.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.185.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.185.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.185.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.186.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.186.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.186.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.186.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.186.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.186.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.187.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.187.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.187.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.187.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.187.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.187.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.188.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.188.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.188.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.188.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.188.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.188.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.189.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.189.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.189.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.189.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.189.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.189.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.190.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.190.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.190.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.190.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.190.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.190.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.191.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.191.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.191.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.191.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.191.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.191.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.192.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.192.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.192.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.192.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.192.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.192.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.193.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.193.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.193.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.193.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.193.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.193.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.194.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.194.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.194.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.194.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.194.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.194.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.195.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.195.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.195.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.195.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.195.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.195.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.196.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.196.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.196.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.196.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.196.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.196.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.197.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.197.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.197.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.197.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.197.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.197.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.198.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.198.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.198.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.198.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.198.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.198.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.199.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.199.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.199.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.199.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.199.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.199.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.200.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.200.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.200.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.200.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.200.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.200.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.201.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.201.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.201.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.201.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.201.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.201.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.202.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.202.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.202.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.202.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.202.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.202.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.203.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.203.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.203.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.203.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.203.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.203.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.204.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.204.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.204.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.204.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.204.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.204.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.205.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.205.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.205.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.205.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.205.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.205.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.206.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.206.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.206.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.206.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.206.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.206.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.207.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.207.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.207.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.207.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.207.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.207.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.208.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.208.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.208.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.208.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.208.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.208.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.209.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.209.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.209.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.209.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.209.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.209.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.210.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.210.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.210.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.210.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.210.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.210.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.211.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.211.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.211.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.211.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.211.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.211.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.212.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.212.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.212.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.212.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.212.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.212.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.213.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.213.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.213.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.213.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.213.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.213.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.214.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.214.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.214.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.214.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.214.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.214.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.215.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.215.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.215.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.215.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.215.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.215.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.216.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.216.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.216.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.216.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.216.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.216.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.217.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.217.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.217.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.217.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.217.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.217.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.218.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.218.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.218.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.218.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.218.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.218.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.219.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.219.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.219.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.219.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.219.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.219.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.220.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.220.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.220.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.220.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.220.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.220.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.221.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.221.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.221.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.221.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.221.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.221.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.222.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.222.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.222.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.222.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.222.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.222.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.223.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.223.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.223.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.223.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.223.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.223.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.224.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.224.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.224.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.224.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.224.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.224.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.225.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.225.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.225.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.225.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.225.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.225.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.226.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.226.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.226.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.226.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.226.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.226.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.227.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.227.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.227.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.227.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.227.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.227.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.228.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.228.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.228.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.228.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.228.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.228.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.229.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.229.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.229.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.229.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.229.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.229.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.230.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.230.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.230.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.230.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.230.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.230.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.231.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.231.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.231.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.231.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.231.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.231.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.232.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.232.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.232.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.232.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.232.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.232.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.233.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.233.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.233.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.233.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.233.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.233.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.234.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.234.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.234.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.234.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.234.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.234.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.235.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.235.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.235.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.235.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.235.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.235.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.236.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.236.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.236.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.236.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.236.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.236.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.237.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.237.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.237.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.237.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.237.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.237.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.238.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.238.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.238.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.238.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.238.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.238.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.239.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.239.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.239.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.239.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.239.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.239.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.240.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.240.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.240.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.240.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.240.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.240.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.241.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.241.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.241.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.241.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.241.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.241.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.242.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.242.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.242.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.242.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.242.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.242.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.243.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.243.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.243.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.243.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.243.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.243.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.244.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.244.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.244.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.244.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.244.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.244.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.245.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.245.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.245.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.245.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.245.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.245.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.246.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.246.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.246.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.246.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.246.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.246.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.247.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.247.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.247.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.247.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.247.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.247.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.248.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.248.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.248.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.248.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.248.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.248.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.249.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.249.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.249.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.249.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.249.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.249.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.250.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.250.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.250.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.250.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.250.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.250.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.251.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.251.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.251.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.251.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.251.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.251.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.252.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.252.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.252.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.252.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.252.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.252.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.253.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.253.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.253.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.253.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.253.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.253.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.254.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.254.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.254.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.254.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.254.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.254.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.255.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.255.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.255.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.255.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.255.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.255.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.input_layernorm.weight": "model-00141-of-000163.safetensors", "model.layers.53.post_attention_layernorm.weight": "model-00141-of-000163.safetensors", "model.layers.54.self_attn.q_a_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.self_attn.q_a_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.self_attn.q_a_layernorm.weight": "model-00142-of-000163.safetensors", "model.layers.54.self_attn.q_b_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.self_attn.q_b_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.self_attn.kv_a_proj_with_mqa.weight": "model-00142-of-000163.safetensors", - "model.layers.54.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.self_attn.kv_a_layernorm.weight": "model-00142-of-000163.safetensors", "model.layers.54.self_attn.kv_b_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.self_attn.kv_b_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.self_attn.o_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.self_attn.o_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.gate.weight": "model-00142-of-000163.safetensors", "model.layers.54.mlp.gate.e_score_correction_bias": "model-00142-of-000163.safetensors", "model.layers.54.mlp.shared_experts.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.shared_experts.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.shared_experts.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.shared_experts.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.shared_experts.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.0.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.0.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.0.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.0.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.0.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.0.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.1.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.1.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.1.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.1.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.1.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.1.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.2.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.2.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.2.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.2.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.2.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.2.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.3.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.3.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.3.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.3.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.3.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.3.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.4.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.4.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.4.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.4.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.4.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.4.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.5.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.5.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.5.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.5.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.5.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.5.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.6.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.6.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.6.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.6.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.6.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.6.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.7.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.7.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.7.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.7.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.7.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.7.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.8.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.8.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.8.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.8.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.8.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.8.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.9.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.9.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.9.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.9.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.9.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.9.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.10.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.10.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.10.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.10.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.10.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.10.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.11.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.11.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.11.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.11.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.11.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.11.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.12.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.12.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.12.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.12.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.12.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.12.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.13.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.13.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.13.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.13.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.13.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.13.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.14.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.14.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.14.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.14.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.14.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.14.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.15.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.15.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.15.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.15.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.15.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.15.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.16.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.16.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.16.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.16.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.16.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.16.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.17.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.17.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.17.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.17.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.17.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.17.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.18.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.18.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.18.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.18.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.18.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.18.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.19.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.19.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.19.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.19.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.19.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.19.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.20.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.20.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.20.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.20.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.20.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.20.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.21.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.21.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.21.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.21.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.21.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.21.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.22.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.22.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.22.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.22.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.22.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.22.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.23.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.23.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.23.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.23.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.23.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.23.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.24.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.24.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.24.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.24.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.24.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.24.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.25.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.25.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.25.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.25.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.25.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.25.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.26.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.26.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.26.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.26.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.26.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.26.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.27.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.27.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.27.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.27.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.27.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.27.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.28.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.28.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.28.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.28.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.28.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.28.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.29.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.29.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.29.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.29.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.29.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.29.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.30.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.30.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.30.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.30.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.30.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.30.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.31.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.31.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.31.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.31.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.31.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.31.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.32.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.32.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.32.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.32.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.32.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.32.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.33.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.33.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.33.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.33.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.33.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.33.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.34.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.34.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.34.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.34.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.34.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.34.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.35.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.35.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.35.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.35.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.35.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.35.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.36.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.36.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.36.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.36.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.36.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.36.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.37.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.37.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.37.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.37.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.37.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.37.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.38.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.38.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.38.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.38.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.38.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.38.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.39.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.39.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.39.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.39.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.39.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.39.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.40.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.40.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.40.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.40.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.40.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.40.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.41.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.41.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.41.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.41.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.41.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.41.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.42.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.42.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.42.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.42.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.42.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.42.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.43.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.43.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.43.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.43.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.43.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.43.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.44.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.44.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.44.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.44.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.44.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.44.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.45.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.45.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.45.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.45.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.45.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.45.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.46.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.46.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.46.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.46.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.46.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.46.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.47.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.47.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.47.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.47.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.47.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.47.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.48.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.48.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.48.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.48.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.48.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.48.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.49.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.49.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.49.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.49.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.49.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.49.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.50.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.50.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.50.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.50.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.50.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.50.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.51.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.51.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.51.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.51.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.51.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.51.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.52.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.52.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.52.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.52.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.52.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.52.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.53.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.53.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.53.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.53.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.53.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.53.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.54.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.54.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.54.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.54.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.54.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.54.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.55.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.55.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.55.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.55.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.55.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.55.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.56.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.56.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.56.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.56.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.56.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.56.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.57.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.57.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.57.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.57.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.57.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.57.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.58.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.58.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.58.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.58.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.58.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.58.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.59.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.59.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.59.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.59.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.59.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.59.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.60.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.60.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.60.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.60.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.60.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.60.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.61.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.61.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.61.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.61.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.61.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.61.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.62.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.62.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.62.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.62.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.62.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.62.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.63.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.63.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.63.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.63.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.63.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.63.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.64.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.64.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.64.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.64.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.64.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.64.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.65.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.65.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.65.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.65.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.65.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.65.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.66.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.66.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.66.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.66.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.66.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.66.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.67.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.67.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.67.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.67.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.67.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.67.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.68.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.68.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.68.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.68.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.68.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.68.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.69.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.69.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.69.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.69.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.69.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.69.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.70.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.70.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.70.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.70.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.70.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.70.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.71.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.71.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.71.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.71.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.71.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.71.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.72.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.72.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.72.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.72.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.72.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.72.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.73.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.73.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.73.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.73.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.73.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.73.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.74.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.74.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.74.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.74.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.74.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.74.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.75.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.75.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.75.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.75.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.75.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.75.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.76.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.76.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.76.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.76.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.76.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.76.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.77.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.77.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.77.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.77.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.77.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.77.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.78.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.78.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.78.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.78.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.78.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.78.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.79.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.79.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.79.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.79.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.79.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.79.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.80.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.80.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.80.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.80.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.80.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.80.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.81.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.81.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.81.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.81.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.81.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.81.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.82.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.82.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.82.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.82.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.82.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.82.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.83.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.83.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.83.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.83.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.83.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.83.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.84.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.84.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.84.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.84.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.84.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.84.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.85.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.85.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.85.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.85.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.85.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.85.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.86.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.86.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.86.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.86.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.86.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.86.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.87.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.87.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.87.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.87.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.87.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.87.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.88.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.88.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.88.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.88.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.88.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.88.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.89.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.89.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.89.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.89.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.89.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.89.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.90.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.90.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.90.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.90.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.90.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.90.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.91.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.91.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.91.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.91.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.91.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.91.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.92.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.92.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.92.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.92.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.92.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.92.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.93.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.93.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.93.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.93.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.93.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.93.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.94.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.94.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.94.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.94.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.94.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.94.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.95.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.95.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.95.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.95.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.95.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.95.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.96.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.96.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.96.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.96.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.96.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.96.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.97.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.97.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.97.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.97.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.97.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.97.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.98.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.98.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.98.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.98.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.98.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.98.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.99.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.99.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.99.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.99.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.99.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.99.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.100.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.100.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.100.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.100.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.100.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.100.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.101.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.101.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.101.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.101.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.101.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.101.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.102.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.102.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.102.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.102.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.102.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.102.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.103.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.103.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.103.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.103.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.103.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.103.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.104.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.104.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.104.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.104.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.104.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.104.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.105.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.105.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.105.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.105.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.105.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.105.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.106.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.106.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.106.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.106.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.106.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.106.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.107.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.107.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.107.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.107.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.107.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.107.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.108.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.108.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.108.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.108.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.108.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.108.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.109.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.109.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.109.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.109.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.109.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.109.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.110.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.110.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.110.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.110.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.110.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.110.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.111.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.111.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.111.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.111.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.111.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.111.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.112.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.112.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.112.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.112.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.112.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.112.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.113.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.113.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.113.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.113.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.113.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.113.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.114.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.114.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.114.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.114.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.114.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.114.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.115.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.115.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.115.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.115.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.115.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.115.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.116.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.116.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.116.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.116.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.116.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.116.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.117.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.117.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.117.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.117.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.117.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.117.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.118.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.118.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.118.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.118.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.118.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.118.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.119.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.119.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.119.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.119.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.119.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.119.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.120.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.120.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.120.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.120.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.120.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.120.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.121.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.121.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.121.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.121.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.121.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.121.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.122.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.122.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.122.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.122.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.122.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.122.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.123.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.123.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.123.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.123.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.123.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.123.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.124.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.124.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.124.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.124.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.124.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.124.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.125.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.125.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.125.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.125.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.125.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.125.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.126.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.126.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.126.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.126.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.126.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.126.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.127.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.127.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.127.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.127.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.127.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.127.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.128.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.128.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.128.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.128.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.128.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.128.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.129.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.129.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.129.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.129.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.129.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.129.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.130.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.130.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.130.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.130.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.130.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.130.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.131.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.131.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.131.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.131.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.131.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.131.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.132.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.132.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.132.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.132.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.132.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.132.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.133.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.133.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.133.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.133.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.133.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.133.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.134.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.134.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.134.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.134.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.134.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.134.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.135.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.135.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.135.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.135.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.135.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.135.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.136.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.136.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.136.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.136.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.136.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.136.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.137.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.137.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.137.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.137.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.137.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.137.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.138.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.138.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.138.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.138.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.138.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.138.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.139.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.139.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.139.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.139.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.139.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.139.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.140.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.140.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.140.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.140.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.140.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.140.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.141.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.141.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.141.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.141.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.141.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.141.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.142.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.142.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.142.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.142.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.142.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.142.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.143.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.143.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.143.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.143.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.143.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.143.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.144.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.144.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.144.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.144.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.144.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.144.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.145.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.145.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.145.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.145.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.145.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.145.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.146.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.146.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.146.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.146.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.146.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.146.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.147.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.147.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.147.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.147.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.147.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.147.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.148.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.148.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.148.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.148.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.148.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.148.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.149.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.149.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.149.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.149.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.149.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.149.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.150.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.150.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.150.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.150.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.150.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.150.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.151.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.151.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.151.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.151.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.151.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.151.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.152.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.152.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.152.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.152.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.152.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.152.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.153.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.153.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.153.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.153.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.153.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.153.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.154.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.154.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.154.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.154.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.154.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.154.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.155.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.155.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.155.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.155.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.155.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.155.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.156.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.156.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.156.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.156.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.156.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.156.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.157.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.157.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.157.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.157.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.157.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.157.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.158.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.158.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.158.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.158.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.158.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.158.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.159.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.159.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.159.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.159.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.159.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.159.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.160.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.160.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.160.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.160.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.160.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.160.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.161.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.161.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.161.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.161.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.161.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.161.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.162.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.162.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.162.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.162.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.162.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.162.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.163.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.163.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.163.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.163.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.163.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.163.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.164.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.164.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.164.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.164.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.164.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.164.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.165.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.165.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.165.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.165.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.165.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.165.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.166.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.166.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.166.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.166.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.166.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.166.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.167.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.167.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.167.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.167.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.167.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.167.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.168.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.168.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.168.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.168.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.168.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.168.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.169.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.169.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.169.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.169.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.169.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.169.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.170.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.170.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.170.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.170.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.170.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.170.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.171.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.171.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.171.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.171.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.171.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.171.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.172.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.172.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.172.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.172.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.172.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.172.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.173.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.173.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.173.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.173.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.173.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.173.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.174.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.174.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.174.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.174.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.174.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.174.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.175.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.175.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.175.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.175.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.175.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.175.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.176.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.176.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.176.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.176.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.176.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.176.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.177.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.177.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.177.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.177.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.177.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.177.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.178.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.178.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.178.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.178.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.178.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.178.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.179.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.179.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.179.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.179.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.179.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.179.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.180.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.180.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.180.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.180.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.180.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.180.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.181.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.181.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.181.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.181.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.181.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.181.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.182.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.182.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.182.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.182.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.182.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.182.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.183.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.183.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.183.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.183.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.183.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.183.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.184.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.184.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.184.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.184.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.184.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.184.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.185.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.185.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.185.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.185.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.185.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.185.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.186.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.186.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.186.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.186.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.186.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.186.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.187.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.187.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.187.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.187.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.187.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.187.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.188.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.188.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.188.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.188.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.188.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.188.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.189.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.189.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.189.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.189.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.189.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.189.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.190.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.190.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.190.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.190.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.190.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.190.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.191.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.191.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.191.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.191.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.191.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.191.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.192.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.192.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.192.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.192.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.192.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.192.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.193.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.193.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.193.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.193.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.193.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.193.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.194.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.194.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.194.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.194.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.194.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.194.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.195.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.195.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.195.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.195.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.195.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.195.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.196.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.196.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.196.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.196.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.196.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.196.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.197.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.197.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.197.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.197.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.197.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.197.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.198.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.198.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.198.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.198.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.198.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.198.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.199.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.199.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.199.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.199.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.199.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.199.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.200.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.200.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.200.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.200.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.200.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.200.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.201.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.201.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.201.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.201.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.201.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.201.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.202.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.202.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.202.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.202.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.202.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.202.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.203.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.203.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.203.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.203.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.203.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.203.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.204.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.204.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.204.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.204.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.204.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.204.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.205.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.205.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.205.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.205.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.205.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.205.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.206.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.206.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.206.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.206.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.206.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.206.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.207.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.207.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.207.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.207.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.207.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.207.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.208.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.208.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.208.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.208.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.208.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.208.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.209.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.209.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.209.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.209.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.209.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.209.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.210.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.210.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.210.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.210.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.210.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.210.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.211.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.211.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.211.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.211.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.211.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.211.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.212.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.212.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.212.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.212.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.212.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.212.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.213.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.213.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.213.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.213.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.213.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.213.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.214.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.214.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.214.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.214.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.214.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.214.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.215.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.215.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.215.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.215.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.215.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.215.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.216.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.216.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.216.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.216.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.216.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.216.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.217.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.217.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.217.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.217.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.217.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.217.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.218.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.218.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.218.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.218.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.218.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.218.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.219.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.219.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.219.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.219.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.219.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.219.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.220.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.220.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.220.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.220.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.220.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.220.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.221.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.221.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.221.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.221.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.221.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.221.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.222.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.222.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.222.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.222.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.222.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.222.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.223.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.223.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.223.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.223.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.223.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.223.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.224.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.224.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.224.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.224.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.224.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.224.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.225.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.225.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.225.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.225.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.225.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.225.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.226.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.226.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.226.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.226.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.226.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.226.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.227.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.227.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.227.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.227.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.227.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.227.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.228.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.228.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.228.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.228.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.228.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.228.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.229.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.229.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.229.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.229.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.229.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.229.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.230.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.230.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.230.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.230.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.230.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.230.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.231.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.231.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.231.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.231.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.231.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.231.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.232.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.232.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.232.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.232.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.232.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.232.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.233.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.233.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.233.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.233.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.233.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.233.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.234.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.234.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.234.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.234.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.234.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.234.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.235.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.235.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.235.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.235.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.235.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.235.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.236.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.236.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.236.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.236.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.236.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.236.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.237.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.237.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.237.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.237.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.237.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.237.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.238.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.238.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.238.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.238.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.238.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.238.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.239.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.239.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.239.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.239.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.239.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.239.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.240.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.240.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.240.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.240.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.240.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.240.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.241.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.241.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.241.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.241.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.241.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.241.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.242.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.242.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.242.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.242.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.242.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.242.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.243.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.243.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.243.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.243.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.243.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.243.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.244.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.244.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.244.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.244.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.244.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.244.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.245.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.245.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.245.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.245.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.245.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.245.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.246.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.246.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.246.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.246.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.246.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.246.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.247.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.247.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.247.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.247.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.247.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.247.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.248.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.248.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.248.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.248.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.248.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.248.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.249.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.249.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.249.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.249.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.249.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.249.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.250.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.250.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.250.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.250.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.250.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.250.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.251.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.251.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.251.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.251.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.251.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.251.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.252.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.252.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.252.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.252.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.252.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.252.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.253.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.253.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.253.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.253.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.253.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.253.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.254.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.254.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.254.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.254.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.254.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.254.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.255.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.255.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.255.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.255.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.255.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.255.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.input_layernorm.weight": "model-00144-of-000163.safetensors", "model.layers.54.post_attention_layernorm.weight": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.q_a_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.self_attn.q_a_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.q_a_layernorm.weight": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.q_b_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.self_attn.q_b_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.kv_a_proj_with_mqa.weight": "model-00144-of-000163.safetensors", - "model.layers.55.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.kv_a_layernorm.weight": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.kv_b_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.self_attn.kv_b_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.o_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.self_attn.o_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.gate.weight": "model-00144-of-000163.safetensors", "model.layers.55.mlp.gate.e_score_correction_bias": "model-00144-of-000163.safetensors", "model.layers.55.mlp.shared_experts.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.shared_experts.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.shared_experts.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.shared_experts.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.shared_experts.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.0.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.0.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.0.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.0.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.0.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.1.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.1.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.1.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.1.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.1.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.2.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.2.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.2.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.2.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.2.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.2.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.3.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.3.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.3.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.3.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.3.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.4.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.4.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.4.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.4.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.4.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.5.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.5.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.5.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.5.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.5.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.6.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.6.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.6.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.6.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.6.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.7.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.7.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.7.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.7.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.7.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.8.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.8.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.8.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.8.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.8.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.8.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.9.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.9.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.9.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.9.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.9.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.9.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.10.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.10.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.10.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.10.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.10.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.10.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.11.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.11.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.11.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.11.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.11.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.11.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.12.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.12.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.12.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.12.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.12.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.12.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.13.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.13.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.13.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.13.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.13.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.13.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.14.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.14.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.14.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.14.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.14.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.14.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.15.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.15.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.15.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.15.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.15.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.15.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.16.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.16.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.16.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.16.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.16.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.16.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.17.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.17.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.17.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.17.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.17.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.17.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.18.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.18.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.18.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.18.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.18.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.18.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.19.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.19.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.19.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.19.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.19.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.19.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.20.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.20.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.20.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.20.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.20.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.20.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.21.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.21.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.21.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.21.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.21.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.21.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.22.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.22.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.22.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.22.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.22.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.22.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.23.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.23.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.23.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.23.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.23.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.23.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.24.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.24.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.24.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.24.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.24.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.24.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.25.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.25.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.25.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.25.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.25.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.25.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.26.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.26.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.26.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.26.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.26.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.26.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.27.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.27.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.27.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.27.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.27.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.27.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.28.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.28.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.28.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.28.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.28.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.28.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.29.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.29.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.29.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.29.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.29.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.29.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.30.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.30.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.30.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.30.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.30.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.30.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.31.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.31.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.31.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.31.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.31.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.31.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.32.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.32.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.32.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.32.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.32.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.32.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.33.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.33.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.33.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.33.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.33.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.33.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.34.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.34.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.34.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.34.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.34.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.34.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.35.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.35.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.35.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.35.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.35.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.35.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.36.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.36.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.36.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.36.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.36.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.36.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.37.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.37.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.37.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.37.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.37.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.37.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.38.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.38.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.38.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.38.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.38.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.38.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.39.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.39.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.39.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.39.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.39.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.39.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.40.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.40.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.40.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.40.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.40.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.40.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.41.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.41.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.41.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.41.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.41.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.41.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.42.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.42.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.42.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.42.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.42.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.42.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.43.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.43.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.43.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.43.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.43.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.43.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.44.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.44.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.44.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.44.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.44.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.44.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.45.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.45.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.45.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.45.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.45.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.45.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.46.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.46.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.46.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.46.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.46.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.46.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.47.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.47.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.47.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.47.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.47.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.47.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.48.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.48.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.48.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.48.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.48.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.48.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.49.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.49.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.49.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.49.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.49.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.49.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.50.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.50.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.50.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.50.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.50.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.50.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.51.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.51.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.51.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.51.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.51.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.51.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.52.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.52.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.52.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.52.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.52.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.52.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.53.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.53.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.53.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.53.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.53.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.53.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.54.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.54.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.54.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.54.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.54.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.54.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.55.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.55.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.55.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.55.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.55.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.55.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.56.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.56.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.56.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.56.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.56.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.56.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.57.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.57.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.57.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.57.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.57.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.57.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.58.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.58.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.58.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.58.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.58.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.58.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.59.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.59.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.59.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.59.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.59.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.59.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.60.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.60.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.60.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.60.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.60.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.60.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.61.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.61.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.61.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.61.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.61.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.61.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.62.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.62.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.62.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.62.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.62.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.62.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.63.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.63.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.63.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.63.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.63.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.63.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.64.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.64.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.64.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.64.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.64.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.64.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.65.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.65.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.65.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.65.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.65.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.65.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.66.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.66.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.66.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.66.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.66.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.66.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.67.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.67.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.67.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.67.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.67.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.67.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.68.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.68.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.68.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.68.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.68.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.68.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.69.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.69.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.69.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.69.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.69.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.69.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.70.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.70.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.70.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.70.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.70.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.70.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.71.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.71.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.71.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.71.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.71.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.71.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.72.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.72.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.72.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.72.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.72.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.72.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.73.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.73.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.73.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.73.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.73.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.73.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.74.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.74.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.74.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.74.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.74.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.74.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.75.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.75.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.75.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.75.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.75.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.75.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.76.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.76.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.76.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.76.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.76.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.76.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.77.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.77.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.77.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.77.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.77.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.77.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.78.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.78.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.78.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.78.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.78.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.78.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.79.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.79.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.79.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.79.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.79.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.79.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.80.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.80.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.80.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.80.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.80.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.80.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.81.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.81.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.81.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.81.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.81.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.81.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.82.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.82.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.82.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.82.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.82.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.82.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.83.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.83.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.83.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.83.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.83.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.83.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.84.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.84.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.84.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.84.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.84.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.84.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.85.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.85.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.85.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.85.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.85.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.85.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.86.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.86.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.86.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.86.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.86.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.86.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.87.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.87.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.87.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.87.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.87.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.87.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.88.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.88.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.88.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.88.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.88.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.88.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.89.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.89.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.89.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.89.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.89.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.89.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.90.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.90.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.90.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.90.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.90.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.90.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.91.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.91.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.91.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.91.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.91.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.91.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.92.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.92.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.92.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.92.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.92.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.92.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.93.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.93.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.93.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.93.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.93.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.93.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.94.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.94.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.94.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.94.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.94.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.94.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.95.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.95.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.95.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.95.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.95.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.95.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.96.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.96.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.96.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.96.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.96.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.96.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.97.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.97.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.97.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.97.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.97.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.97.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.98.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.98.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.98.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.98.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.98.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.98.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.99.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.99.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.99.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.99.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.99.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.99.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.100.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.100.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.100.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.100.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.100.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.100.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.101.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.101.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.101.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.101.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.101.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.101.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.102.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.102.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.102.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.102.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.102.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.102.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.103.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.103.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.103.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.103.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.103.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.103.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.104.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.104.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.104.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.104.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.104.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.104.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.105.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.105.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.105.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.105.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.105.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.105.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.106.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.106.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.106.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.106.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.106.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.106.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.107.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.107.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.107.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.107.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.107.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.107.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.108.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.108.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.108.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.108.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.108.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.108.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.109.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.109.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.109.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.109.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.109.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.109.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.110.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.110.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.110.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.110.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.110.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.110.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.111.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.111.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.111.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.111.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.111.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.111.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.112.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.112.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.112.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.112.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.112.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.112.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.113.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.113.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.113.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.113.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.113.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.113.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.114.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.114.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.114.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.114.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.114.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.114.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.115.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.115.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.115.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.115.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.115.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.115.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.116.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.116.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.116.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.116.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.116.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.116.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.117.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.117.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.117.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.117.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.117.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.117.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.118.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.118.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.118.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.118.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.118.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.118.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.119.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.119.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.119.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.119.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.119.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.119.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.120.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.120.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.120.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.120.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.120.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.120.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.121.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.121.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.121.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.121.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.121.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.121.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.122.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.122.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.122.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.122.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.122.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.122.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.123.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.123.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.123.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.123.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.123.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.123.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.124.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.124.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.124.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.124.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.124.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.124.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.125.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.125.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.125.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.125.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.125.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.125.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.126.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.126.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.126.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.126.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.126.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.126.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.127.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.127.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.127.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.127.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.127.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.127.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.128.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.128.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.128.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.128.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.128.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.128.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.129.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.129.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.129.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.129.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.129.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.129.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.130.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.130.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.130.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.130.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.130.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.130.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.131.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.131.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.131.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.131.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.131.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.131.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.132.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.132.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.132.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.132.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.132.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.132.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.133.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.133.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.133.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.133.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.133.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.133.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.134.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.134.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.134.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.134.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.134.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.134.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.135.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.135.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.135.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.135.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.135.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.135.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.136.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.136.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.136.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.136.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.136.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.136.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.137.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.137.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.137.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.137.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.137.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.137.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.138.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.138.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.138.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.138.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.138.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.138.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.139.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.139.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.139.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.139.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.139.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.139.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.140.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.140.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.140.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.140.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.140.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.140.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.141.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.141.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.141.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.141.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.141.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.141.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.142.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.142.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.142.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.142.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.142.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.142.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.143.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.143.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.143.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.143.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.143.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.143.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.144.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.144.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.144.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.144.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.144.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.144.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.145.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.145.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.145.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.145.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.145.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.145.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.146.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.146.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.146.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.146.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.146.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.146.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.147.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.147.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.147.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.147.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.147.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.147.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.148.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.148.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.148.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.148.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.148.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.148.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.149.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.149.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.149.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.149.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.149.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.149.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.150.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.150.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.150.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.150.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.150.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.150.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.151.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.151.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.151.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.151.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.151.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.151.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.152.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.152.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.152.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.152.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.152.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.152.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.153.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.153.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.153.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.153.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.153.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.153.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.154.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.154.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.154.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.154.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.154.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.154.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.155.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.155.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.155.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.155.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.155.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.155.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.156.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.156.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.156.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.156.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.156.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.156.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.157.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.157.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.157.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.157.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.157.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.157.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.158.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.158.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.158.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.158.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.158.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.158.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.159.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.159.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.159.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.159.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.159.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.159.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.160.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.160.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.160.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.160.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.160.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.160.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.161.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.161.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.161.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.161.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.161.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.161.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.162.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.162.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.162.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.162.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.162.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.162.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.163.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.163.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.163.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.163.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.163.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.163.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.164.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.164.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.164.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.164.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.164.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.164.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.165.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.165.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.165.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.165.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.165.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.165.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.166.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.166.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.166.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.166.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.166.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.166.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.167.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.167.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.167.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.167.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.167.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.167.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.168.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.168.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.168.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.168.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.168.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.168.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.169.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.169.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.169.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.169.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.169.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.169.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.170.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.170.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.170.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.170.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.170.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.170.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.171.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.171.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.171.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.171.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.171.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.171.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.172.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.172.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.172.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.172.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.172.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.172.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.173.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.173.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.173.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.173.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.173.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.173.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.174.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.174.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.174.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.174.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.174.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.174.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.175.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.175.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.175.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.175.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.175.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.175.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.176.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.176.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.176.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.176.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.176.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.176.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.177.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.177.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.177.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.177.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.177.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.177.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.178.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.178.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.178.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.178.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.178.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.178.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.179.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.179.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.179.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.179.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.179.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.179.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.180.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.180.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.180.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.180.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.180.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.180.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.181.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.181.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.181.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.181.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.181.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.181.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.182.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.182.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.182.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.182.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.182.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.182.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.183.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.183.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.183.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.183.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.183.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.183.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.184.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.184.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.184.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.184.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.184.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.184.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.185.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.185.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.185.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.185.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.185.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.185.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.186.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.186.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.186.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.186.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.186.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.186.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.187.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.187.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.187.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.187.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.187.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.187.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.188.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.188.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.188.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.188.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.188.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.188.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.189.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.189.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.189.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.189.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.189.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.189.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.190.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.190.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.190.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.190.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.190.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.190.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.191.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.191.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.191.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.191.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.191.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.191.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.192.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.192.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.192.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.192.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.192.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.192.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.193.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.193.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.193.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.193.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.193.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.193.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.194.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.194.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.194.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.194.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.194.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.194.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.195.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.195.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.195.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.195.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.195.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.195.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.196.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.196.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.196.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.196.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.196.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.196.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.197.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.197.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.197.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.197.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.197.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.197.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.198.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.198.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.198.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.198.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.198.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.198.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.199.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.199.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.199.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.199.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.199.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.199.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.200.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.200.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.200.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.200.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.200.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.200.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.201.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.201.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.201.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.201.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.201.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.201.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.202.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.202.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.202.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.202.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.202.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.202.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.203.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.203.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.203.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.203.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.203.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.203.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.204.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.204.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.204.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.204.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.204.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.204.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.205.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.205.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.205.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.205.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.205.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.205.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.206.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.206.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.206.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.206.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.206.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.206.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.207.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.207.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.207.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.207.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.207.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.207.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.208.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.208.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.208.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.208.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.208.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.208.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.209.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.209.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.209.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.209.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.209.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.209.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.210.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.210.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.210.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.210.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.210.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.210.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.211.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.211.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.211.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.211.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.211.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.211.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.212.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.212.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.212.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.212.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.212.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.212.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.213.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.213.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.213.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.213.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.213.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.213.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.214.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.214.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.214.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.214.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.214.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.214.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.215.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.215.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.215.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.215.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.215.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.215.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.216.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.216.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.216.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.216.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.216.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.216.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.217.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.217.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.217.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.217.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.217.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.217.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.218.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.218.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.218.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.218.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.218.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.218.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.219.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.219.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.219.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.219.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.219.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.219.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.220.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.220.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.220.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.220.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.220.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.220.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.221.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.221.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.221.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.221.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.221.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.221.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.222.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.222.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.222.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.222.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.222.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.222.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.223.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.223.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.223.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.223.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.223.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.223.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.224.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.224.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.224.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.224.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.224.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.224.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.225.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.225.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.225.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.225.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.225.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.225.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.226.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.226.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.226.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.226.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.226.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.226.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.227.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.227.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.227.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.227.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.227.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.227.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.228.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.228.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.228.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.228.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.228.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.228.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.229.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.229.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.229.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.229.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.229.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.229.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.230.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.230.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.230.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.230.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.230.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.230.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.231.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.231.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.231.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.231.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.231.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.231.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.232.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.232.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.232.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.232.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.232.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.232.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.233.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.233.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.233.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.233.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.233.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.233.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.234.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.234.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.234.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.234.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.234.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.234.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.235.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.235.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.235.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.235.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.235.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.235.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.236.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.236.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.236.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.236.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.236.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.236.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.237.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.237.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.237.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.237.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.237.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.237.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.238.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.238.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.238.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.238.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.238.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.238.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.239.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.239.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.239.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.239.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.239.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.239.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.240.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.240.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.240.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.240.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.240.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.240.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.241.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.241.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.241.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.241.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.241.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.241.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.242.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.242.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.242.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.242.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.242.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.242.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.243.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.243.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.243.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.243.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.243.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.243.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.244.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.244.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.244.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.244.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.244.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.244.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.245.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.245.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.245.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.245.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.245.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.245.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.246.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.246.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.246.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.246.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.246.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.246.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.247.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.247.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.247.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.247.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.247.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.247.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.248.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.248.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.248.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.248.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.248.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.248.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.249.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.249.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.249.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.249.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.249.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.249.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.250.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.250.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.250.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.250.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.250.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.250.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.251.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.251.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.251.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.251.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.251.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.251.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.252.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.252.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.252.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.252.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.252.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.252.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.253.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.253.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.253.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.253.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.253.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.253.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.254.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.254.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.254.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.254.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.254.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.254.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.255.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.255.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.255.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.255.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.255.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.255.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.input_layernorm.weight": "model-00147-of-000163.safetensors", "model.layers.55.post_attention_layernorm.weight": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.q_a_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.self_attn.q_a_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.q_a_layernorm.weight": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.q_b_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.self_attn.q_b_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.kv_a_proj_with_mqa.weight": "model-00147-of-000163.safetensors", - "model.layers.56.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.kv_a_layernorm.weight": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.kv_b_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.self_attn.kv_b_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.o_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.self_attn.o_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.gate.weight": "model-00147-of-000163.safetensors", "model.layers.56.mlp.gate.e_score_correction_bias": "model-00147-of-000163.safetensors", "model.layers.56.mlp.shared_experts.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.shared_experts.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.shared_experts.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.shared_experts.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.shared_experts.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.0.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.0.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.0.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.0.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.0.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.0.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.1.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.1.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.1.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.1.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.1.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.1.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.2.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.2.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.2.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.2.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.2.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.2.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.3.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.3.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.3.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.3.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.3.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.3.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.4.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.4.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.4.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.4.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.4.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.4.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.5.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.5.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.5.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.5.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.5.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.5.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.6.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.6.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.6.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.6.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.6.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.6.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.7.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.7.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.7.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.7.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.7.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.7.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.8.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.8.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.8.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.8.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.8.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.8.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.9.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.9.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.9.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.9.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.9.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.9.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.10.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.10.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.10.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.10.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.10.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.10.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.11.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.11.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.11.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.11.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.11.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.11.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.12.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.12.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.12.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.12.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.12.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.12.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.13.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.13.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.13.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.13.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.13.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.13.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.14.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.14.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.14.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.14.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.14.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.14.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.15.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.15.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.15.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.15.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.15.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.15.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.16.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.16.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.16.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.16.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.16.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.16.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.17.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.17.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.17.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.17.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.17.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.17.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.18.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.18.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.18.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.18.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.18.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.18.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.19.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.19.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.19.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.19.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.19.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.19.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.20.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.20.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.20.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.20.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.20.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.20.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.21.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.21.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.21.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.21.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.21.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.21.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.22.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.22.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.22.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.22.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.22.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.22.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.23.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.23.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.23.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.23.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.23.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.23.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.24.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.24.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.24.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.24.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.24.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.24.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.25.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.25.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.25.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.25.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.25.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.25.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.26.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.26.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.26.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.26.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.26.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.26.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.27.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.27.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.27.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.27.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.27.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.27.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.28.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.28.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.28.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.28.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.28.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.28.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.29.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.29.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.29.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.29.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.29.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.29.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.30.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.30.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.30.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.30.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.30.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.30.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.31.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.31.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.31.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.31.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.31.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.31.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.32.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.32.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.32.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.32.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.32.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.32.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.33.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.33.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.33.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.33.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.33.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.33.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.34.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.34.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.34.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.34.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.34.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.34.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.35.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.35.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.35.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.35.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.35.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.35.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.36.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.36.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.36.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.36.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.36.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.36.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.37.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.37.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.37.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.37.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.37.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.37.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.38.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.38.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.38.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.38.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.38.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.38.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.39.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.39.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.39.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.39.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.39.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.39.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.40.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.40.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.40.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.40.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.40.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.40.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.41.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.41.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.41.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.41.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.41.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.41.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.42.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.42.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.42.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.42.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.42.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.42.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.43.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.43.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.43.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.43.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.43.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.43.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.44.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.44.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.44.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.44.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.44.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.44.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.45.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.45.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.45.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.45.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.45.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.45.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.46.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.46.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.46.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.46.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.46.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.46.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.47.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.47.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.47.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.47.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.47.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.47.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.48.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.48.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.48.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.48.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.48.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.48.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.49.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.49.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.49.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.49.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.49.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.49.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.50.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.50.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.50.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.50.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.50.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.50.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.51.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.51.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.51.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.51.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.51.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.51.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.52.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.52.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.52.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.52.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.52.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.52.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.53.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.53.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.53.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.53.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.53.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.53.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.54.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.54.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.54.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.54.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.54.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.54.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.55.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.55.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.55.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.55.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.55.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.55.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.56.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.56.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.56.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.56.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.56.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.56.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.57.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.57.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.57.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.57.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.57.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.57.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.58.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.58.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.58.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.58.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.58.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.58.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.59.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.59.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.59.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.59.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.59.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.59.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.60.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.60.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.60.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.60.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.60.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.60.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.61.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.61.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.61.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.61.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.61.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.61.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.62.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.62.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.62.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.62.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.62.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.62.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.63.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.63.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.63.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.63.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.63.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.63.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.64.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.64.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.64.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.64.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.64.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.64.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.65.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.65.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.65.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.65.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.65.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.65.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.66.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.66.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.66.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.66.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.66.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.66.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.67.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.67.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.67.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.67.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.67.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.67.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.68.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.68.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.68.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.68.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.68.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.68.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.69.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.69.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.69.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.69.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.69.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.69.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.70.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.70.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.70.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.70.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.70.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.70.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.71.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.71.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.71.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.71.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.71.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.71.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.72.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.72.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.72.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.72.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.72.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.72.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.73.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.73.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.73.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.73.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.73.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.73.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.74.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.74.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.74.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.74.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.74.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.74.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.75.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.75.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.75.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.75.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.75.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.75.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.76.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.76.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.76.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.76.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.76.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.76.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.77.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.77.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.77.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.77.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.77.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.77.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.78.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.78.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.78.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.78.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.78.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.78.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.79.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.79.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.79.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.79.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.79.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.79.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.80.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.80.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.80.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.80.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.80.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.80.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.81.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.81.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.81.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.81.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.81.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.81.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.82.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.82.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.82.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.82.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.82.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.82.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.83.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.83.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.83.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.83.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.83.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.83.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.84.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.84.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.84.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.84.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.84.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.84.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.85.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.85.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.85.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.85.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.85.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.85.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.86.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.86.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.86.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.86.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.86.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.86.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.87.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.87.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.87.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.87.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.87.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.87.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.88.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.88.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.88.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.88.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.88.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.88.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.89.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.89.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.89.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.89.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.89.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.89.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.90.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.90.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.90.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.90.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.90.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.90.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.91.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.91.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.91.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.91.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.91.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.91.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.92.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.92.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.92.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.92.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.92.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.92.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.93.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.93.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.93.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.93.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.93.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.93.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.94.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.94.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.94.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.94.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.94.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.94.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.95.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.95.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.95.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.95.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.95.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.95.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.96.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.96.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.96.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.96.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.96.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.96.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.97.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.97.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.97.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.97.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.97.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.97.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.98.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.98.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.98.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.98.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.98.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.98.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.99.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.99.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.99.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.99.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.99.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.99.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.100.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.100.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.100.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.100.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.100.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.100.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.101.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.101.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.101.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.101.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.101.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.101.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.102.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.102.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.102.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.102.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.102.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.102.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.103.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.103.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.103.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.103.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.103.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.103.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.104.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.104.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.104.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.104.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.104.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.104.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.105.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.105.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.105.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.105.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.105.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.105.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.106.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.106.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.106.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.106.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.106.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.106.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.107.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.107.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.107.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.107.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.107.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.107.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.108.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.108.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.108.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.108.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.108.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.108.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.109.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.109.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.109.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.109.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.109.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.109.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.110.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.110.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.110.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.110.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.110.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.110.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.111.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.111.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.111.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.111.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.111.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.111.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.112.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.112.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.112.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.112.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.112.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.112.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.113.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.113.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.113.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.113.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.113.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.113.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.114.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.114.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.114.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.114.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.114.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.114.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.115.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.115.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.115.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.115.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.115.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.115.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.116.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.116.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.116.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.116.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.116.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.116.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.117.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.117.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.117.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.117.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.117.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.117.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.118.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.118.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.118.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.118.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.118.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.118.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.119.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.119.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.119.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.119.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.119.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.119.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.120.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.120.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.120.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.120.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.120.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.120.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.121.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.121.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.121.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.121.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.121.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.121.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.122.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.122.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.122.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.122.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.122.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.122.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.123.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.123.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.123.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.123.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.123.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.123.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.124.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.124.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.124.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.124.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.124.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.124.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.125.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.125.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.125.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.125.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.125.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.125.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.126.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.126.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.126.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.126.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.126.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.126.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.127.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.127.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.127.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.127.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.127.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.127.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.128.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.128.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.128.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.128.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.128.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.128.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.129.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.129.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.129.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.129.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.129.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.129.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.130.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.130.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.130.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.130.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.130.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.130.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.131.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.131.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.131.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.131.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.131.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.131.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.132.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.132.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.132.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.132.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.132.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.132.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.133.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.133.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.133.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.133.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.133.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.133.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.134.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.134.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.134.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.134.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.134.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.134.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.135.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.135.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.135.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.135.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.135.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.135.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.136.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.136.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.136.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.136.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.136.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.136.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.137.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.137.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.137.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.137.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.137.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.137.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.138.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.138.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.138.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.138.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.138.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.138.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.139.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.139.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.139.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.139.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.139.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.139.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.140.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.140.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.140.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.140.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.140.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.140.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.141.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.141.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.141.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.141.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.141.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.141.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.142.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.142.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.142.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.142.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.142.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.142.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.143.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.143.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.143.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.143.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.143.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.143.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.144.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.144.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.144.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.144.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.144.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.144.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.145.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.145.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.145.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.145.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.145.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.145.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.146.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.146.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.146.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.146.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.146.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.146.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.147.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.147.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.147.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.147.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.147.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.147.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.148.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.148.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.148.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.148.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.148.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.148.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.149.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.149.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.149.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.149.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.149.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.149.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.150.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.150.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.150.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.150.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.150.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.150.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.151.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.151.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.151.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.151.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.151.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.151.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.152.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.152.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.152.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.152.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.152.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.152.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.153.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.153.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.153.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.153.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.153.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.153.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.154.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.154.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.154.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.154.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.154.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.154.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.155.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.155.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.155.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.155.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.155.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.155.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.156.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.156.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.156.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.156.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.156.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.156.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.157.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.157.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.157.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.157.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.157.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.157.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.158.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.158.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.158.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.158.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.158.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.158.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.159.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.159.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.159.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.159.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.159.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.159.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.160.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.160.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.160.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.160.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.160.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.160.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.161.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.161.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.161.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.161.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.161.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.161.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.162.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.162.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.162.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.162.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.162.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.162.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.163.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.163.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.163.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.163.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.163.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.163.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.164.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.164.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.164.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.164.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.164.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.164.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.165.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.165.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.165.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.165.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.165.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.165.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.166.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.166.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.166.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.166.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.166.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.166.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.167.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.167.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.167.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.167.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.167.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.167.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.168.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.168.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.168.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.168.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.168.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.168.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.169.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.169.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.169.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.169.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.169.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.169.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.170.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.170.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.170.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.170.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.170.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.170.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.171.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.171.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.171.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.171.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.171.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.171.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.172.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.172.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.172.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.172.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.172.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.172.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.173.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.173.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.173.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.173.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.173.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.173.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.174.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.174.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.174.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.174.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.174.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.174.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.175.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.175.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.175.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.175.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.175.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.175.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.176.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.176.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.176.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.176.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.176.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.176.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.177.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.177.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.177.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.177.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.177.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.177.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.178.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.178.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.178.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.178.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.178.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.178.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.179.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.179.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.179.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.179.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.179.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.179.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.180.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.180.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.180.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.180.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.180.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.180.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.181.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.181.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.181.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.181.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.181.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.181.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.182.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.182.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.182.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.182.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.182.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.182.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.183.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.183.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.183.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.183.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.183.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.183.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.184.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.184.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.184.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.184.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.184.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.184.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.185.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.185.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.185.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.185.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.185.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.185.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.186.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.186.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.186.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.186.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.186.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.186.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.187.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.187.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.187.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.187.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.187.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.187.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.188.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.188.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.188.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.188.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.188.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.188.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.189.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.189.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.189.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.189.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.189.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.189.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.190.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.190.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.190.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.190.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.190.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.190.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.191.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.191.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.191.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.191.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.191.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.191.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.192.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.192.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.192.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.192.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.192.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.192.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.193.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.193.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.193.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.193.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.193.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.193.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.194.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.194.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.194.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.194.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.194.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.194.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.195.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.195.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.195.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.195.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.195.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.195.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.196.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.196.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.196.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.196.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.196.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.196.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.197.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.197.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.197.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.197.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.197.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.197.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.198.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.198.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.198.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.198.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.198.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.198.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.199.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.199.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.199.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.199.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.199.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.199.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.200.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.200.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.200.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.200.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.200.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.200.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.201.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.201.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.201.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.201.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.201.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.201.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.202.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.202.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.202.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.202.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.202.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.202.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.203.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.203.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.203.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.203.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.203.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.203.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.204.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.204.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.204.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.204.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.204.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.204.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.205.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.205.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.205.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.205.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.205.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.205.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.206.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.206.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.206.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.206.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.206.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.206.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.207.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.207.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.207.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.207.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.207.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.207.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.208.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.208.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.208.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.208.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.208.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.208.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.209.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.209.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.209.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.209.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.209.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.209.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.210.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.210.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.210.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.210.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.210.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.210.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.211.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.211.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.211.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.211.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.211.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.211.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.212.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.212.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.212.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.212.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.212.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.212.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.213.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.213.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.213.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.213.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.213.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.213.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.214.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.214.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.214.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.214.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.214.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.214.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.215.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.215.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.215.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.215.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.215.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.215.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.216.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.216.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.216.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.216.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.216.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.216.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.217.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.217.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.217.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.217.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.217.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.217.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.218.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.218.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.218.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.218.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.218.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.218.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.219.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.219.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.219.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.219.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.219.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.219.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.220.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.220.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.220.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.220.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.220.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.220.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.221.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.221.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.221.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.221.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.221.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.221.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.222.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.222.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.222.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.222.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.222.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.222.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.223.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.223.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.223.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.223.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.223.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.223.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.224.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.224.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.224.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.224.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.224.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.224.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.225.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.225.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.225.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.225.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.225.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.225.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.226.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.226.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.226.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.226.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.226.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.226.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.227.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.227.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.227.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.227.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.227.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.227.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.228.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.228.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.228.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.228.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.228.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.228.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.229.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.229.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.229.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.229.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.229.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.229.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.230.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.230.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.230.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.230.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.230.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.230.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.231.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.231.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.231.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.231.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.231.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.231.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.232.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.232.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.232.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.232.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.232.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.232.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.233.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.233.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.233.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.233.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.233.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.233.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.234.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.234.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.234.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.234.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.234.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.234.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.235.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.235.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.235.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.235.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.235.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.235.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.236.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.236.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.236.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.236.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.236.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.236.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.237.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.237.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.237.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.237.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.237.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.237.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.238.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.238.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.238.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.238.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.238.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.238.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.239.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.239.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.239.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.239.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.239.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.239.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.240.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.240.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.240.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.240.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.240.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.240.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.241.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.241.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.241.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.241.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.241.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.241.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.242.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.242.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.242.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.242.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.242.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.242.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.243.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.243.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.243.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.243.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.243.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.243.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.244.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.244.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.244.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.244.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.244.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.244.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.245.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.245.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.245.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.245.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.245.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.245.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.246.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.246.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.246.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.246.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.246.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.246.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.247.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.247.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.247.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.247.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.247.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.247.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.248.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.248.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.248.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.248.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.248.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.248.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.249.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.249.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.249.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.249.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.249.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.249.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.250.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.250.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.250.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.250.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.250.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.250.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.251.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.251.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.251.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.251.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.251.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.251.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.252.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.252.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.252.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.252.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.252.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.252.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.253.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.253.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.253.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.253.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.253.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.253.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.254.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.254.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.254.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.254.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.254.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.254.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.255.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.255.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.255.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.255.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.255.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.255.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.input_layernorm.weight": "model-00150-of-000163.safetensors", "model.layers.56.post_attention_layernorm.weight": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.q_a_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.self_attn.q_a_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.q_a_layernorm.weight": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.q_b_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.self_attn.q_b_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.kv_a_proj_with_mqa.weight": "model-00150-of-000163.safetensors", - "model.layers.57.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.kv_a_layernorm.weight": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.kv_b_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.self_attn.kv_b_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.o_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.self_attn.o_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.gate.weight": "model-00150-of-000163.safetensors", "model.layers.57.mlp.gate.e_score_correction_bias": "model-00150-of-000163.safetensors", "model.layers.57.mlp.shared_experts.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.shared_experts.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.shared_experts.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.shared_experts.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.shared_experts.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.0.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.0.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.0.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.0.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.0.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.0.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.1.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.1.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.1.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.1.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.1.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.2.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.2.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.2.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.2.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.2.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.3.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.3.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.3.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.3.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.3.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.4.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.4.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.4.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.4.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.4.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.4.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.5.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.5.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.5.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.5.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.5.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.6.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.6.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.6.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.6.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.6.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.7.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.7.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.7.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.7.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.7.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.8.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.8.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.8.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.8.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.8.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.8.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.9.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.9.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.9.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.9.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.9.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.9.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.10.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.10.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.10.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.10.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.10.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.10.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.11.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.11.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.11.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.11.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.11.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.11.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.12.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.12.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.12.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.12.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.12.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.12.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.13.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.13.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.13.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.13.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.13.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.13.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.14.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.14.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.14.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.14.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.14.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.14.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.15.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.15.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.15.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.15.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.15.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.15.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.16.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.16.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.16.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.16.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.16.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.16.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.17.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.17.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.17.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.17.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.17.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.17.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.18.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.18.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.18.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.18.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.18.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.18.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.19.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.19.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.19.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.19.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.19.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.19.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.20.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.20.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.20.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.20.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.20.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.20.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.21.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.21.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.21.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.21.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.21.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.21.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.22.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.22.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.22.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.22.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.22.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.22.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.23.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.23.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.23.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.23.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.23.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.23.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.24.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.24.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.24.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.24.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.24.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.24.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.25.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.25.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.25.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.25.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.25.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.25.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.26.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.26.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.26.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.26.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.26.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.26.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.27.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.27.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.27.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.27.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.27.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.27.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.28.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.28.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.28.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.28.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.28.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.28.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.29.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.29.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.29.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.29.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.29.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.29.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.30.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.30.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.30.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.30.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.30.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.30.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.31.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.31.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.31.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.31.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.31.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.31.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.32.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.32.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.32.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.32.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.32.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.32.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.33.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.33.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.33.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.33.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.33.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.33.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.34.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.34.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.34.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.34.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.34.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.34.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.35.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.35.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.35.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.35.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.35.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.35.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.36.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.36.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.36.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.36.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.36.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.36.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.37.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.37.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.37.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.37.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.37.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.37.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.38.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.38.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.38.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.38.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.38.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.38.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.39.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.39.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.39.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.39.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.39.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.39.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.40.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.40.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.40.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.40.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.40.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.40.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.41.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.41.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.41.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.41.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.41.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.41.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.42.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.42.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.42.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.42.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.42.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.42.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.43.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.43.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.43.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.43.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.43.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.43.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.44.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.44.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.44.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.44.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.44.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.44.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.45.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.45.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.45.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.45.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.45.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.45.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.46.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.46.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.46.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.46.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.46.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.46.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.47.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.47.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.47.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.47.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.47.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.47.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.48.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.48.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.48.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.48.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.48.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.48.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.49.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.49.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.49.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.49.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.49.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.49.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.50.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.50.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.50.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.50.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.50.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.50.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.51.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.51.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.51.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.51.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.51.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.51.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.52.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.52.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.52.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.52.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.52.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.52.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.53.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.53.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.53.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.53.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.53.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.53.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.54.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.54.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.54.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.54.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.54.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.54.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.55.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.55.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.55.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.55.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.55.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.55.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.56.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.56.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.56.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.56.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.56.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.56.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.57.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.57.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.57.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.57.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.57.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.57.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.58.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.58.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.58.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.58.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.58.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.58.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.59.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.59.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.59.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.59.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.59.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.59.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.60.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.60.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.60.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.60.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.60.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.60.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.61.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.61.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.61.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.61.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.61.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.61.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.62.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.62.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.62.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.62.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.62.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.62.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.63.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.63.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.63.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.63.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.63.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.63.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.64.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.64.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.64.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.64.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.64.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.64.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.65.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.65.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.65.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.65.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.65.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.65.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.66.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.66.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.66.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.66.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.66.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.66.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.67.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.67.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.67.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.67.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.67.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.67.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.68.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.68.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.68.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.68.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.68.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.68.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.69.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.69.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.69.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.69.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.69.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.69.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.70.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.70.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.70.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.70.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.70.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.70.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.71.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.71.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.71.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.71.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.71.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.71.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.72.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.72.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.72.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.72.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.72.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.72.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.73.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.73.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.73.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.73.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.73.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.73.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.74.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.74.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.74.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.74.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.74.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.74.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.75.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.75.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.75.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.75.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.75.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.75.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.76.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.76.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.76.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.76.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.76.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.76.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.77.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.77.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.77.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.77.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.77.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.77.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.78.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.78.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.78.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.78.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.78.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.78.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.79.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.79.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.79.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.79.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.79.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.79.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.80.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.80.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.80.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.80.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.80.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.80.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.81.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.81.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.81.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.81.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.81.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.81.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.82.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.82.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.82.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.82.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.82.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.82.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.83.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.83.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.83.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.83.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.83.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.83.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.84.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.84.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.84.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.84.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.84.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.84.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.85.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.85.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.85.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.85.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.85.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.85.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.86.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.86.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.86.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.86.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.86.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.86.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.87.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.87.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.87.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.87.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.87.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.87.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.88.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.88.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.88.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.88.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.88.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.88.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.89.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.89.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.89.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.89.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.89.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.89.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.90.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.90.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.90.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.90.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.90.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.90.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.91.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.91.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.91.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.91.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.91.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.91.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.92.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.92.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.92.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.92.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.92.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.92.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.93.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.93.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.93.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.93.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.93.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.93.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.94.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.94.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.94.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.94.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.94.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.94.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.95.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.95.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.95.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.95.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.95.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.95.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.96.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.96.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.96.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.96.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.96.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.96.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.97.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.97.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.97.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.97.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.97.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.97.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.98.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.98.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.98.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.98.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.98.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.98.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.99.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.99.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.99.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.99.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.99.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.99.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.100.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.100.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.100.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.100.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.100.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.100.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.101.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.101.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.101.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.101.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.101.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.101.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.102.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.102.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.102.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.102.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.102.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.102.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.103.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.103.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.103.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.103.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.103.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.103.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.104.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.104.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.104.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.104.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.104.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.104.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.105.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.105.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.105.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.105.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.105.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.105.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.106.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.106.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.106.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.106.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.106.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.106.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.107.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.107.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.107.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.107.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.107.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.107.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.108.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.108.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.108.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.108.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.108.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.108.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.109.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.109.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.109.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.109.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.109.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.109.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.110.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.110.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.110.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.110.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.110.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.110.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.111.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.111.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.111.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.111.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.111.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.111.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.112.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.112.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.112.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.112.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.112.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.112.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.113.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.113.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.113.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.113.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.113.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.113.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.114.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.114.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.114.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.114.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.114.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.114.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.115.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.115.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.115.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.115.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.115.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.115.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.116.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.116.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.116.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.116.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.116.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.116.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.117.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.117.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.117.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.117.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.117.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.117.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.118.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.118.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.118.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.118.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.118.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.118.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.119.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.119.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.119.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.119.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.119.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.119.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.120.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.120.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.120.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.120.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.120.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.120.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.121.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.121.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.121.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.121.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.121.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.121.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.122.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.122.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.122.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.122.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.122.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.122.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.123.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.123.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.123.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.123.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.123.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.123.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.124.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.124.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.124.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.124.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.124.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.124.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.125.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.125.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.125.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.125.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.125.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.125.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.126.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.126.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.126.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.126.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.126.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.126.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.127.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.127.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.127.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.127.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.127.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.127.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.128.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.128.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.128.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.128.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.128.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.128.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.129.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.129.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.129.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.129.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.129.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.129.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.130.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.130.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.130.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.130.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.130.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.130.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.131.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.131.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.131.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.131.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.131.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.131.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.132.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.132.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.132.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.132.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.132.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.132.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.133.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.133.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.133.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.133.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.133.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.133.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.134.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.134.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.134.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.134.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.134.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.134.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.135.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.135.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.135.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.135.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.135.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.135.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.136.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.136.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.136.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.136.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.136.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.136.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.137.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.137.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.137.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.137.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.137.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.137.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.138.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.138.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.138.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.138.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.138.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.138.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.139.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.139.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.139.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.139.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.139.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.139.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.140.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.140.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.140.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.140.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.140.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.140.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.141.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.141.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.141.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.141.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.141.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.141.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.142.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.142.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.142.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.142.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.142.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.142.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.143.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.143.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.143.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.143.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.143.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.143.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.144.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.144.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.144.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.144.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.144.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.144.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.145.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.145.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.145.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.145.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.145.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.145.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.146.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.146.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.146.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.146.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.146.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.146.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.147.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.147.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.147.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.147.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.147.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.147.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.148.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.148.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.148.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.148.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.148.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.148.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.149.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.149.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.149.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.149.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.149.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.149.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.150.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.150.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.150.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.150.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.150.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.150.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.151.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.151.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.151.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.151.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.151.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.151.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.152.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.152.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.152.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.152.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.152.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.152.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.153.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.153.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.153.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.153.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.153.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.153.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.154.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.154.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.154.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.154.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.154.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.154.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.155.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.155.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.155.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.155.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.155.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.155.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.156.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.156.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.156.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.156.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.156.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.156.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.157.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.157.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.157.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.157.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.157.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.157.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.158.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.158.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.158.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.158.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.158.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.158.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.159.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.159.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.159.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.159.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.159.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.159.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.160.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.160.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.160.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.160.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.160.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.160.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.161.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.161.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.161.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.161.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.161.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.161.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.162.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.162.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.162.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.162.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.162.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.162.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.163.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.163.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.163.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.163.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.163.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.163.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.164.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.164.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.164.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.164.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.164.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.164.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.165.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.165.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.165.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.165.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.165.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.165.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.166.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.166.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.166.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.166.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.166.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.166.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.167.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.167.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.167.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.167.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.167.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.167.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.168.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.168.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.168.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.168.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.168.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.168.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.169.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.169.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.169.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.169.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.169.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.169.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.170.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.170.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.170.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.170.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.170.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.170.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.171.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.171.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.171.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.171.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.171.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.171.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.172.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.172.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.172.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.172.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.172.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.172.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.173.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.173.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.173.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.173.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.173.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.173.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.174.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.174.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.174.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.174.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.174.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.174.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.175.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.175.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.175.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.175.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.175.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.175.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.176.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.176.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.176.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.176.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.176.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.176.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.177.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.177.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.177.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.177.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.177.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.177.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.178.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.178.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.178.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.178.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.178.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.178.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.179.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.179.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.179.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.179.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.179.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.179.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.180.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.180.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.180.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.180.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.180.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.180.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.181.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.181.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.181.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.181.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.181.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.181.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.182.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.182.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.182.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.182.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.182.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.182.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.183.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.183.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.183.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.183.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.183.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.183.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.184.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.184.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.184.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.184.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.184.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.184.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.185.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.185.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.185.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.185.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.185.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.185.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.186.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.186.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.186.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.186.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.186.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.186.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.187.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.187.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.187.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.187.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.187.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.187.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.188.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.188.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.188.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.188.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.188.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.188.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.189.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.189.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.189.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.189.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.189.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.189.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.190.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.190.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.190.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.190.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.190.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.190.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.191.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.191.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.191.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.191.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.191.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.191.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.192.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.192.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.192.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.192.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.192.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.192.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.193.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.193.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.193.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.193.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.193.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.193.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.194.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.194.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.194.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.194.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.194.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.194.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.195.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.195.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.195.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.195.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.195.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.195.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.196.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.196.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.196.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.196.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.196.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.196.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.197.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.197.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.197.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.197.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.197.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.197.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.198.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.198.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.198.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.198.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.198.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.198.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.199.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.199.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.199.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.199.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.199.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.199.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.200.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.200.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.200.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.200.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.200.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.200.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.201.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.201.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.201.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.201.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.201.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.201.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.202.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.202.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.202.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.202.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.202.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.202.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.203.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.203.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.203.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.203.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.203.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.203.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.204.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.204.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.204.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.204.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.204.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.204.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.205.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.205.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.205.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.205.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.205.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.205.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.206.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.206.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.206.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.206.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.206.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.206.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.207.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.207.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.207.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.207.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.207.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.207.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.208.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.208.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.208.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.208.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.208.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.208.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.209.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.209.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.209.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.209.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.209.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.209.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.210.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.210.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.210.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.210.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.210.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.210.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.211.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.211.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.211.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.211.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.211.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.211.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.212.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.212.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.212.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.212.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.212.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.212.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.213.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.213.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.213.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.213.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.213.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.213.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.214.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.214.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.214.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.214.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.214.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.214.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.215.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.215.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.215.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.215.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.215.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.215.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.216.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.216.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.216.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.216.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.216.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.216.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.217.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.217.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.217.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.217.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.217.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.217.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.218.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.218.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.218.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.218.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.218.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.218.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.219.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.219.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.219.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.219.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.219.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.219.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.220.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.220.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.220.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.220.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.220.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.220.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.221.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.221.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.221.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.221.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.221.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.221.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.222.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.222.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.222.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.222.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.222.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.222.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.223.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.223.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.223.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.223.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.223.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.223.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.224.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.224.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.224.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.224.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.224.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.224.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.225.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.225.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.225.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.225.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.225.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.225.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.226.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.226.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.226.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.226.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.226.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.226.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.227.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.227.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.227.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.227.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.227.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.227.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.228.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.228.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.228.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.228.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.228.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.228.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.229.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.229.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.229.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.229.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.229.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.229.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.230.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.230.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.230.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.230.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.230.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.230.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.231.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.231.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.231.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.231.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.231.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.231.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.232.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.232.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.232.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.232.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.232.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.232.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.233.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.233.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.233.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.233.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.233.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.233.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.234.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.234.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.234.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.234.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.234.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.234.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.235.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.235.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.235.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.235.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.235.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.235.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.236.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.236.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.236.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.236.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.236.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.236.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.237.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.237.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.237.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.237.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.237.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.237.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.238.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.238.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.238.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.238.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.238.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.238.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.239.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.239.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.239.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.239.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.239.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.239.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.240.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.240.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.240.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.240.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.240.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.240.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.241.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.241.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.241.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.241.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.241.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.241.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.242.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.242.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.242.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.242.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.242.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.242.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.243.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.243.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.243.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.243.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.243.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.243.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.244.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.244.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.244.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.244.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.244.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.244.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.245.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.245.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.245.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.245.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.245.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.245.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.246.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.246.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.246.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.246.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.246.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.246.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.247.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.247.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.247.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.247.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.247.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.247.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.248.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.248.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.248.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.248.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.248.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.248.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.249.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.249.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.249.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.249.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.249.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.249.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.250.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.250.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.250.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.250.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.250.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.250.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.251.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.251.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.251.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.251.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.251.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.251.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.252.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.252.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.252.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.252.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.252.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.252.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.253.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.253.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.253.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.253.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.253.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.253.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.254.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.254.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.254.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.254.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.254.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.254.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.255.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.255.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.255.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.255.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.255.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.255.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.input_layernorm.weight": "model-00152-of-000163.safetensors", "model.layers.57.post_attention_layernorm.weight": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.q_a_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.self_attn.q_a_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.q_a_layernorm.weight": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.q_b_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.self_attn.q_b_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.kv_a_proj_with_mqa.weight": "model-00152-of-000163.safetensors", - "model.layers.58.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.kv_a_layernorm.weight": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.kv_b_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.self_attn.kv_b_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.o_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.self_attn.o_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.gate.weight": "model-00152-of-000163.safetensors", "model.layers.58.mlp.gate.e_score_correction_bias": "model-00152-of-000163.safetensors", "model.layers.58.mlp.shared_experts.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.shared_experts.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.shared_experts.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.shared_experts.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.shared_experts.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.0.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.0.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.0.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.0.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.0.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.0.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.1.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.1.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.1.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.1.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.1.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.1.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.2.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.2.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.2.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.2.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.2.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.2.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.3.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.3.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.3.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.3.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.3.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.3.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.4.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.4.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.4.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.4.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.4.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.4.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.5.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.5.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.5.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.5.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.5.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.5.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.6.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.6.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.6.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.6.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.6.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.6.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.7.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.7.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.7.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.7.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.7.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.7.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.8.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.8.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.8.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.8.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.8.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.8.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.9.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.9.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.9.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.9.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.9.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.9.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.10.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.10.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.10.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.10.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.10.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.10.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.11.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.11.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.11.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.11.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.11.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.11.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.12.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.12.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.12.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.12.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.12.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.12.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.13.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.13.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.13.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.13.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.13.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.13.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.14.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.14.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.14.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.14.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.14.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.14.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.15.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.15.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.15.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.15.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.15.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.15.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.16.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.16.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.16.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.16.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.16.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.16.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.17.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.17.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.17.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.17.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.17.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.17.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.18.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.18.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.18.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.18.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.18.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.18.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.19.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.19.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.19.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.19.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.19.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.19.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.20.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.20.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.20.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.20.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.20.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.20.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.21.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.21.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.21.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.21.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.21.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.21.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.22.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.22.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.22.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.22.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.22.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.22.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.23.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.23.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.23.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.23.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.23.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.23.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.24.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.24.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.24.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.24.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.24.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.24.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.25.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.25.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.25.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.25.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.25.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.25.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.26.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.26.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.26.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.26.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.26.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.26.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.27.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.27.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.27.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.27.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.27.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.27.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.28.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.28.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.28.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.28.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.28.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.28.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.29.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.29.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.29.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.29.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.29.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.29.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.30.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.30.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.30.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.30.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.30.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.30.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.31.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.31.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.31.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.31.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.31.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.31.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.32.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.32.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.32.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.32.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.32.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.32.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.33.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.33.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.33.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.33.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.33.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.33.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.34.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.34.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.34.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.34.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.34.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.34.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.35.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.35.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.35.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.35.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.35.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.35.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.36.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.36.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.36.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.36.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.36.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.36.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.37.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.37.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.37.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.37.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.37.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.37.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.38.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.38.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.38.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.38.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.38.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.38.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.39.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.39.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.39.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.39.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.39.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.39.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.40.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.40.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.40.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.40.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.40.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.40.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.41.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.41.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.41.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.41.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.41.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.41.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.42.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.42.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.42.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.42.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.42.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.42.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.43.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.43.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.43.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.43.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.43.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.43.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.44.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.44.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.44.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.44.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.44.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.44.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.45.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.45.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.45.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.45.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.45.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.45.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.46.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.46.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.46.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.46.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.46.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.46.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.47.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.47.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.47.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.47.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.47.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.47.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.48.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.48.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.48.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.48.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.48.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.48.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.49.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.49.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.49.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.49.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.49.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.49.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.50.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.50.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.50.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.50.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.50.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.50.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.51.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.51.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.51.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.51.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.51.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.51.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.52.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.52.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.52.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.52.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.52.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.52.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.53.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.53.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.53.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.53.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.53.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.53.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.54.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.54.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.54.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.54.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.54.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.54.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.55.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.55.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.55.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.55.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.55.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.55.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.56.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.56.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.56.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.56.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.56.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.56.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.57.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.57.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.57.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.57.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.57.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.57.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.58.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.58.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.58.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.58.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.58.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.58.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.59.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.59.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.59.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.59.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.59.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.59.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.60.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.60.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.60.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.60.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.60.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.60.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.61.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.61.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.61.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.61.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.61.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.61.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.62.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.62.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.62.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.62.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.62.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.62.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.63.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.63.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.63.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.63.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.63.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.63.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.64.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.64.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.64.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.64.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.64.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.64.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.65.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.65.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.65.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.65.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.65.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.65.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.66.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.66.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.66.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.66.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.66.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.66.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.67.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.67.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.67.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.67.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.67.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.67.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.68.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.68.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.68.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.68.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.68.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.68.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.69.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.69.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.69.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.69.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.69.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.69.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.70.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.70.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.70.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.70.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.70.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.70.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.71.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.71.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.71.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.71.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.71.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.71.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.72.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.72.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.72.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.72.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.72.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.72.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.73.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.73.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.73.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.73.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.73.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.73.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.74.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.74.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.74.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.74.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.74.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.74.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.75.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.75.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.75.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.75.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.75.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.75.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.76.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.76.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.76.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.76.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.76.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.76.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.77.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.77.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.77.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.77.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.77.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.77.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.78.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.78.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.78.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.78.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.78.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.78.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.79.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.79.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.79.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.79.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.79.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.79.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.80.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.80.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.80.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.80.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.80.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.80.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.81.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.81.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.81.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.81.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.81.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.81.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.82.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.82.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.82.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.82.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.82.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.82.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.83.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.83.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.83.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.83.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.83.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.83.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.84.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.84.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.84.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.84.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.84.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.84.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.85.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.85.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.85.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.85.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.85.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.85.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.86.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.86.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.86.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.86.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.86.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.86.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.87.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.87.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.87.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.87.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.87.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.87.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.88.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.88.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.88.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.88.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.88.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.88.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.89.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.89.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.89.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.89.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.89.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.89.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.90.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.90.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.90.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.90.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.90.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.90.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.91.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.91.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.91.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.91.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.91.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.91.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.92.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.92.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.92.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.92.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.92.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.92.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.93.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.93.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.93.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.93.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.93.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.93.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.94.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.94.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.94.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.94.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.94.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.94.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.95.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.95.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.95.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.95.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.95.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.95.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.96.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.96.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.96.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.96.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.96.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.96.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.97.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.97.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.97.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.97.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.97.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.97.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.98.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.98.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.98.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.98.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.98.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.98.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.99.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.99.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.99.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.99.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.99.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.99.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.100.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.100.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.100.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.100.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.100.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.100.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.101.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.101.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.101.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.101.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.101.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.101.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.102.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.102.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.102.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.102.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.102.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.102.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.103.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.103.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.103.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.103.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.103.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.103.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.104.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.104.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.104.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.104.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.104.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.104.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.105.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.105.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.105.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.105.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.105.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.105.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.106.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.106.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.106.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.106.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.106.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.106.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.107.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.107.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.107.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.107.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.107.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.107.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.108.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.108.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.108.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.108.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.108.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.108.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.109.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.109.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.109.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.109.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.109.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.109.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.110.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.110.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.110.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.110.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.110.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.110.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.111.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.111.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.111.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.111.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.111.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.111.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.112.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.112.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.112.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.112.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.112.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.112.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.113.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.113.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.113.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.113.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.113.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.113.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.114.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.114.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.114.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.114.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.114.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.114.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.115.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.115.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.115.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.115.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.115.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.115.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.116.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.116.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.116.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.116.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.116.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.116.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.117.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.117.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.117.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.117.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.117.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.117.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.118.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.118.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.118.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.118.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.118.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.118.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.119.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.119.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.119.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.119.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.119.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.119.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.120.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.120.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.120.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.120.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.120.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.120.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.121.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.121.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.121.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.121.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.121.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.121.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.122.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.122.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.122.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.122.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.122.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.122.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.123.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.123.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.123.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.123.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.123.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.123.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.124.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.124.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.124.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.124.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.124.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.124.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.125.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.125.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.125.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.125.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.125.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.125.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.126.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.126.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.126.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.126.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.126.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.126.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.127.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.127.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.127.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.127.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.127.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.127.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.128.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.128.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.128.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.128.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.128.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.128.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.129.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.129.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.129.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.129.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.129.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.129.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.130.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.130.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.130.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.130.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.130.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.130.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.131.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.131.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.131.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.131.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.131.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.131.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.132.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.132.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.132.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.132.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.132.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.132.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.133.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.133.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.133.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.133.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.133.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.133.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.134.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.134.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.134.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.134.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.134.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.134.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.135.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.135.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.135.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.135.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.135.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.135.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.136.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.136.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.136.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.136.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.136.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.136.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.137.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.137.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.137.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.137.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.137.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.137.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.138.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.138.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.138.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.138.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.138.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.138.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.139.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.139.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.139.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.139.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.139.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.139.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.140.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.140.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.140.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.140.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.140.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.140.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.141.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.141.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.141.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.141.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.141.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.141.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.142.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.142.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.142.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.142.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.142.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.142.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.143.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.143.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.143.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.143.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.143.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.143.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.144.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.144.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.144.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.144.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.144.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.144.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.145.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.145.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.145.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.145.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.145.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.145.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.146.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.146.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.146.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.146.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.146.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.146.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.147.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.147.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.147.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.147.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.147.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.147.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.148.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.148.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.148.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.148.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.148.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.148.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.149.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.149.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.149.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.149.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.149.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.149.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.150.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.150.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.150.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.150.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.150.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.150.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.151.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.151.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.151.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.151.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.151.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.151.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.152.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.152.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.152.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.152.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.152.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.152.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.153.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.153.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.153.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.153.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.153.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.153.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.154.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.154.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.154.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.154.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.154.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.154.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.155.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.155.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.155.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.155.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.155.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.155.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.156.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.156.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.156.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.156.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.156.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.156.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.157.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.157.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.157.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.157.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.157.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.157.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.158.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.158.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.158.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.158.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.158.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.158.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.159.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.159.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.159.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.159.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.159.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.159.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.160.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.160.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.160.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.160.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.160.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.160.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.161.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.161.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.161.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.161.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.161.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.161.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.162.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.162.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.162.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.162.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.162.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.162.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.163.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.163.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.163.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.163.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.163.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.163.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.164.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.164.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.164.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.164.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.164.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.164.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.165.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.165.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.165.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.165.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.165.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.165.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.166.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.166.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.166.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.166.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.166.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.166.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.167.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.167.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.167.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.167.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.167.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.167.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.168.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.168.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.168.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.168.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.168.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.168.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.169.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.169.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.169.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.169.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.169.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.169.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.170.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.170.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.170.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.170.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.170.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.170.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.171.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.171.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.171.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.171.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.171.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.171.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.172.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.172.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.172.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.172.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.172.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.172.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.173.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.173.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.173.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.173.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.173.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.173.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.174.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.174.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.174.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.174.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.174.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.174.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.175.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.175.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.175.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.175.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.175.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.175.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.176.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.176.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.176.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.176.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.176.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.176.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.177.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.177.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.177.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.177.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.177.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.177.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.178.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.178.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.178.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.178.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.178.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.178.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.179.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.179.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.179.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.179.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.179.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.179.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.180.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.180.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.180.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.180.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.180.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.180.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.181.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.181.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.181.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.181.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.181.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.181.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.182.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.182.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.182.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.182.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.182.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.182.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.183.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.183.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.183.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.183.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.183.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.183.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.184.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.184.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.184.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.184.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.184.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.184.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.185.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.185.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.185.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.185.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.185.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.185.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.186.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.186.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.186.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.186.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.186.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.186.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.187.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.187.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.187.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.187.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.187.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.187.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.188.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.188.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.188.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.188.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.188.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.188.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.189.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.189.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.189.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.189.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.189.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.189.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.190.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.190.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.190.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.190.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.190.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.190.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.191.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.191.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.191.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.191.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.191.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.191.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.192.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.192.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.192.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.192.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.192.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.192.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.193.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.193.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.193.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.193.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.193.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.193.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.194.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.194.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.194.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.194.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.194.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.194.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.195.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.195.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.195.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.195.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.195.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.195.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.196.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.196.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.196.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.196.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.196.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.196.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.197.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.197.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.197.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.197.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.197.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.197.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.198.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.198.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.198.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.198.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.198.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.198.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.199.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.199.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.199.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.199.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.199.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.199.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.200.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.200.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.200.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.200.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.200.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.200.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.201.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.201.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.201.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.201.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.201.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.201.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.202.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.202.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.202.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.202.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.202.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.202.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.203.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.203.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.203.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.203.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.203.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.203.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.204.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.204.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.204.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.204.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.204.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.204.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.205.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.205.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.205.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.205.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.205.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.205.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.206.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.206.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.206.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.206.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.206.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.206.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.207.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.207.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.207.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.207.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.207.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.207.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.208.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.208.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.208.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.208.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.208.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.208.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.209.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.209.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.209.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.209.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.209.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.209.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.210.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.210.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.210.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.210.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.210.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.210.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.211.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.211.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.211.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.211.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.211.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.211.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.212.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.212.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.212.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.212.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.212.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.212.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.213.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.213.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.213.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.213.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.213.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.213.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.214.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.214.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.214.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.214.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.214.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.214.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.215.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.215.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.215.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.215.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.215.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.215.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.216.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.216.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.216.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.216.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.216.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.216.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.217.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.217.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.217.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.217.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.217.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.217.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.218.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.218.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.218.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.218.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.218.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.218.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.219.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.219.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.219.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.219.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.219.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.219.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.220.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.220.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.220.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.220.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.220.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.220.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.221.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.221.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.221.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.221.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.221.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.221.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.222.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.222.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.222.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.222.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.222.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.222.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.223.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.223.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.223.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.223.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.223.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.223.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.224.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.224.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.224.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.224.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.224.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.224.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.225.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.225.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.225.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.225.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.225.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.225.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.226.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.226.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.226.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.226.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.226.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.226.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.227.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.227.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.227.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.227.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.227.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.227.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.228.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.228.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.228.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.228.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.228.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.228.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.229.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.229.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.229.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.229.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.229.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.229.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.230.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.230.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.230.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.230.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.230.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.230.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.231.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.231.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.231.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.231.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.231.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.231.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.232.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.232.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.232.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.232.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.232.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.232.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.233.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.233.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.233.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.233.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.233.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.233.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.234.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.234.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.234.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.234.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.234.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.234.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.235.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.235.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.235.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.235.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.235.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.235.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.236.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.236.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.236.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.236.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.236.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.236.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.237.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.237.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.237.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.237.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.237.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.237.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.238.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.238.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.238.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.238.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.238.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.238.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.239.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.239.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.239.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.239.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.239.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.239.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.240.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.240.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.240.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.240.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.240.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.240.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.241.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.241.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.241.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.241.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.241.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.241.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.242.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.242.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.242.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.242.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.242.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.242.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.243.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.243.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.243.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.243.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.243.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.243.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.244.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.244.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.244.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.244.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.244.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.244.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.245.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.245.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.245.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.245.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.245.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.245.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.246.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.246.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.246.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.246.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.246.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.246.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.247.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.247.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.247.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.247.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.247.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.247.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.248.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.248.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.248.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.248.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.248.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.248.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.249.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.249.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.249.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.249.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.249.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.249.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.250.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.250.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.250.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.250.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.250.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.250.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.251.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.251.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.251.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.251.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.251.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.251.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.252.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.252.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.252.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.252.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.252.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.252.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.253.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.253.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.253.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.253.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.253.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.253.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.254.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.254.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.254.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.254.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.254.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.254.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.255.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.255.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.255.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.255.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.255.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.255.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.input_layernorm.weight": "model-00155-of-000163.safetensors", "model.layers.58.post_attention_layernorm.weight": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.q_a_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.self_attn.q_a_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.q_a_layernorm.weight": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.q_b_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.self_attn.q_b_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.kv_a_proj_with_mqa.weight": "model-00155-of-000163.safetensors", - "model.layers.59.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.kv_a_layernorm.weight": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.kv_b_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.self_attn.kv_b_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.o_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.self_attn.o_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.gate.weight": "model-00155-of-000163.safetensors", "model.layers.59.mlp.gate.e_score_correction_bias": "model-00155-of-000163.safetensors", "model.layers.59.mlp.shared_experts.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.shared_experts.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.shared_experts.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.shared_experts.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.shared_experts.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.0.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.0.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.0.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.0.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.0.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.0.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.1.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.1.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.1.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.1.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.1.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.2.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.2.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.2.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.2.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.2.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.3.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.3.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.3.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.3.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.3.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.4.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.4.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.4.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.4.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.4.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.4.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.5.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.5.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.5.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.5.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.5.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.6.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.6.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.6.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.6.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.6.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.7.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.7.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.7.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.7.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.7.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.8.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.8.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.8.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.8.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.8.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.8.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.9.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.9.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.9.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.9.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.9.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.9.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.10.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.10.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.10.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.10.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.10.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.10.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.11.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.11.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.11.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.11.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.11.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.11.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.12.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.12.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.12.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.12.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.12.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.12.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.13.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.13.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.13.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.13.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.13.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.13.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.14.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.14.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.14.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.14.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.14.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.14.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.15.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.15.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.15.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.15.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.15.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.15.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.16.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.16.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.16.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.16.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.16.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.16.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.17.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.17.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.17.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.17.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.17.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.17.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.18.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.18.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.18.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.18.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.18.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.18.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.19.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.19.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.19.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.19.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.19.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.19.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.20.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.20.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.20.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.20.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.20.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.20.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.21.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.21.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.21.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.21.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.21.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.21.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.22.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.22.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.22.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.22.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.22.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.22.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.23.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.23.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.23.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.23.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.23.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.23.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.24.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.24.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.24.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.24.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.24.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.24.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.25.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.25.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.25.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.25.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.25.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.25.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.26.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.26.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.26.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.26.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.26.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.26.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.27.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.27.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.27.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.27.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.27.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.27.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.28.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.28.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.28.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.28.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.28.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.28.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.29.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.29.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.29.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.29.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.29.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.29.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.30.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.30.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.30.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.30.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.30.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.30.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.31.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.31.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.31.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.31.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.31.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.31.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.32.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.32.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.32.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.32.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.32.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.32.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.33.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.33.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.33.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.33.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.33.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.33.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.34.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.34.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.34.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.34.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.34.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.34.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.35.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.35.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.35.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.35.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.35.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.35.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.36.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.36.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.36.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.36.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.36.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.36.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.37.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.37.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.37.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.37.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.37.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.37.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.38.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.38.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.38.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.38.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.38.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.38.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.39.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.39.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.39.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.39.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.39.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.39.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.40.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.40.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.40.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.40.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.40.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.40.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.41.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.41.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.41.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.41.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.41.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.41.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.42.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.42.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.42.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.42.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.42.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.42.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.43.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.43.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.43.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.43.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.43.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.43.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.44.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.44.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.44.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.44.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.44.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.44.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.45.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.45.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.45.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.45.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.45.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.45.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.46.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.46.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.46.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.46.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.46.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.46.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.47.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.47.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.47.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.47.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.47.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.47.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.48.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.48.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.48.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.48.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.48.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.48.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.49.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.49.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.49.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.49.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.49.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.49.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.50.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.50.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.50.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.50.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.50.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.50.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.51.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.51.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.51.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.51.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.51.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.51.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.52.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.52.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.52.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.52.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.52.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.52.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.53.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.53.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.53.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.53.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.53.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.53.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.54.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.54.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.54.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.54.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.54.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.54.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.55.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.55.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.55.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.55.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.55.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.55.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.56.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.56.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.56.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.56.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.56.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.56.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.57.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.57.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.57.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.57.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.57.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.57.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.58.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.58.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.58.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.58.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.58.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.58.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.59.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.59.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.59.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.59.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.59.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.59.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.60.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.60.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.60.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.60.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.60.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.60.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.61.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.61.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.61.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.61.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.61.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.61.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.62.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.62.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.62.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.62.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.62.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.62.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.63.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.63.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.63.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.63.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.63.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.63.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.64.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.64.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.64.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.64.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.64.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.64.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.65.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.65.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.65.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.65.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.65.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.65.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.66.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.66.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.66.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.66.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.66.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.66.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.67.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.67.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.67.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.67.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.67.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.67.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.68.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.68.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.68.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.68.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.68.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.68.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.69.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.69.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.69.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.69.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.69.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.69.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.70.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.70.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.70.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.70.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.70.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.70.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.71.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.71.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.71.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.71.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.71.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.71.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.72.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.72.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.72.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.72.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.72.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.72.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.73.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.73.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.73.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.73.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.73.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.73.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.74.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.74.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.74.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.74.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.74.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.74.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.75.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.75.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.75.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.75.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.75.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.75.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.76.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.76.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.76.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.76.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.76.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.76.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.77.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.77.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.77.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.77.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.77.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.77.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.78.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.78.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.78.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.78.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.78.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.78.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.79.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.79.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.79.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.79.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.79.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.79.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.80.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.80.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.80.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.80.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.80.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.80.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.81.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.81.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.81.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.81.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.81.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.81.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.82.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.82.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.82.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.82.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.82.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.82.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.83.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.83.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.83.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.83.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.83.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.83.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.84.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.84.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.84.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.84.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.84.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.84.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.85.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.85.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.85.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.85.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.85.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.85.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.86.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.86.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.86.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.86.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.86.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.86.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.87.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.87.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.87.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.87.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.87.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.87.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.88.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.88.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.88.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.88.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.88.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.88.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.89.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.89.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.89.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.89.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.89.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.89.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.90.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.90.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.90.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.90.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.90.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.90.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.91.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.91.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.91.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.91.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.91.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.91.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.92.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.92.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.92.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.92.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.92.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.92.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.93.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.93.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.93.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.93.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.93.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.93.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.94.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.94.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.94.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.94.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.94.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.94.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.95.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.95.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.95.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.95.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.95.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.95.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.96.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.96.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.96.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.96.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.96.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.96.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.97.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.97.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.97.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.97.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.97.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.97.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.98.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.98.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.98.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.98.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.98.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.98.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.99.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.99.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.99.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.99.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.99.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.99.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.100.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.100.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.100.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.100.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.100.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.100.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.101.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.101.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.101.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.101.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.101.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.101.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.102.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.102.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.102.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.102.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.102.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.102.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.103.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.103.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.103.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.103.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.103.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.103.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.104.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.104.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.104.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.104.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.104.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.104.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.105.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.105.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.105.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.105.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.105.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.105.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.106.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.106.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.106.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.106.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.106.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.106.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.107.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.107.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.107.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.107.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.107.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.107.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.108.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.108.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.108.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.108.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.108.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.108.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.109.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.109.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.109.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.109.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.109.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.109.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.110.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.110.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.110.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.110.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.110.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.110.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.111.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.111.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.111.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.111.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.111.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.111.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.112.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.112.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.112.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.112.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.112.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.112.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.113.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.113.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.113.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.113.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.113.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.113.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.114.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.114.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.114.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.114.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.114.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.114.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.115.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.115.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.115.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.115.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.115.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.115.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.116.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.116.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.116.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.116.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.116.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.116.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.117.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.117.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.117.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.117.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.117.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.117.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.118.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.118.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.118.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.118.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.118.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.118.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.119.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.119.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.119.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.119.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.119.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.119.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.120.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.120.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.120.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.120.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.120.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.120.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.121.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.121.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.121.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.121.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.121.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.121.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.122.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.122.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.122.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.122.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.122.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.122.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.123.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.123.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.123.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.123.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.123.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.123.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.124.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.124.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.124.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.124.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.124.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.124.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.125.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.125.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.125.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.125.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.125.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.125.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.126.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.126.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.126.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.126.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.126.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.126.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.127.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.127.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.127.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.127.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.127.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.127.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.128.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.128.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.128.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.128.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.128.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.128.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.129.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.129.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.129.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.129.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.129.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.129.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.130.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.130.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.130.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.130.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.130.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.130.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.131.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.131.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.131.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.131.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.131.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.131.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.132.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.132.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.132.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.132.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.132.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.132.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.133.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.133.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.133.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.133.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.133.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.133.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.134.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.134.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.134.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.134.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.134.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.134.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.135.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.135.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.135.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.135.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.135.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.135.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.136.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.136.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.136.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.136.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.136.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.136.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.137.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.137.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.137.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.137.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.137.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.137.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.138.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.138.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.138.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.138.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.138.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.138.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.139.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.139.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.139.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.139.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.139.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.139.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.140.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.140.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.140.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.140.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.140.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.140.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.141.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.141.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.141.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.141.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.141.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.141.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.142.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.142.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.142.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.142.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.142.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.142.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.143.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.143.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.143.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.143.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.143.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.143.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.144.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.144.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.144.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.144.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.144.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.144.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.145.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.145.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.145.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.145.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.145.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.145.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.146.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.146.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.146.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.146.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.146.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.146.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.147.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.147.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.147.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.147.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.147.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.147.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.148.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.148.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.148.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.148.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.148.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.148.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.149.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.149.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.149.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.149.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.149.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.149.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.150.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.150.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.150.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.150.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.150.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.150.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.151.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.151.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.151.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.151.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.151.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.151.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.152.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.152.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.152.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.152.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.152.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.152.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.153.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.153.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.153.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.153.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.153.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.153.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.154.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.154.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.154.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.154.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.154.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.154.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.155.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.155.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.155.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.155.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.155.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.155.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.156.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.156.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.156.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.156.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.156.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.156.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.157.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.157.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.157.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.157.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.157.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.157.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.158.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.158.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.158.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.158.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.158.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.158.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.159.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.159.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.159.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.159.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.159.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.159.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.160.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.160.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.160.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.160.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.160.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.160.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.161.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.161.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.161.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.161.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.161.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.161.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.162.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.162.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.162.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.162.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.162.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.162.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.163.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.163.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.163.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.163.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.163.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.163.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.164.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.164.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.164.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.164.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.164.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.164.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.165.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.165.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.165.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.165.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.165.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.165.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.166.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.166.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.166.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.166.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.166.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.166.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.167.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.167.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.167.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.167.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.167.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.167.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.168.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.168.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.168.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.168.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.168.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.168.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.169.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.169.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.169.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.169.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.169.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.169.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.170.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.170.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.170.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.170.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.170.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.170.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.171.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.171.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.171.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.171.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.171.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.171.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.172.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.172.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.172.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.172.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.172.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.172.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.173.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.173.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.173.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.173.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.173.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.173.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.174.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.174.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.174.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.174.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.174.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.174.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.175.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.175.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.175.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.175.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.175.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.175.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.176.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.176.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.176.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.176.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.176.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.176.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.177.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.177.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.177.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.177.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.177.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.177.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.178.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.178.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.178.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.178.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.178.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.178.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.179.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.179.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.179.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.179.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.179.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.179.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.180.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.180.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.180.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.180.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.180.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.180.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.181.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.181.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.181.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.181.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.181.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.181.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.182.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.182.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.182.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.182.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.182.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.182.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.183.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.183.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.183.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.183.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.183.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.183.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.184.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.184.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.184.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.184.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.184.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.184.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.185.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.185.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.185.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.185.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.185.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.185.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.186.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.186.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.186.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.186.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.186.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.186.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.187.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.187.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.187.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.187.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.187.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.187.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.188.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.188.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.188.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.188.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.188.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.188.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.189.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.189.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.189.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.189.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.189.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.189.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.190.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.190.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.190.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.190.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.190.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.190.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.191.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.191.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.191.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.191.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.191.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.191.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.192.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.192.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.192.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.192.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.192.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.192.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.193.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.193.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.193.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.193.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.193.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.193.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.194.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.194.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.194.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.194.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.194.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.194.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.195.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.195.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.195.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.195.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.195.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.195.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.196.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.196.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.196.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.196.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.196.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.196.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.197.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.197.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.197.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.197.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.197.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.197.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.198.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.198.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.198.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.198.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.198.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.198.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.199.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.199.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.199.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.199.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.199.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.199.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.200.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.200.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.200.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.200.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.200.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.200.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.201.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.201.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.201.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.201.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.201.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.201.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.202.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.202.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.202.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.202.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.202.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.202.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.203.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.203.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.203.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.203.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.203.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.203.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.204.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.204.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.204.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.204.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.204.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.204.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.205.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.205.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.205.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.205.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.205.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.205.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.206.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.206.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.206.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.206.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.206.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.206.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.207.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.207.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.207.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.207.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.207.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.207.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.208.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.208.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.208.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.208.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.208.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.208.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.209.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.209.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.209.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.209.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.209.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.209.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.210.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.210.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.210.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.210.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.210.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.210.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.211.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.211.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.211.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.211.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.211.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.211.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.212.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.212.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.212.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.212.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.212.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.212.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.213.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.213.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.213.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.213.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.213.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.213.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.214.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.214.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.214.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.214.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.214.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.214.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.215.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.215.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.215.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.215.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.215.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.215.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.216.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.216.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.216.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.216.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.216.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.216.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.217.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.217.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.217.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.217.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.217.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.217.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.218.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.218.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.218.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.218.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.218.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.218.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.219.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.219.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.219.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.219.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.219.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.219.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.220.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.220.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.220.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.220.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.220.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.220.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.221.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.221.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.221.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.221.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.221.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.221.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.222.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.222.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.222.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.222.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.222.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.222.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.223.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.223.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.223.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.223.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.223.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.223.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.224.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.224.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.224.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.224.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.224.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.224.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.225.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.225.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.225.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.225.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.225.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.225.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.226.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.226.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.226.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.226.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.226.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.226.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.227.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.227.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.227.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.227.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.227.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.227.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.228.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.228.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.228.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.228.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.228.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.228.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.229.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.229.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.229.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.229.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.229.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.229.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.230.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.230.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.230.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.230.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.230.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.230.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.231.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.231.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.231.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.231.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.231.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.231.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.232.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.232.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.232.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.232.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.232.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.232.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.233.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.233.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.233.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.233.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.233.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.233.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.234.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.234.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.234.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.234.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.234.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.234.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.235.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.235.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.235.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.235.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.235.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.235.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.236.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.236.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.236.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.236.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.236.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.236.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.237.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.237.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.237.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.237.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.237.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.237.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.238.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.238.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.238.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.238.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.238.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.238.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.239.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.239.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.239.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.239.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.239.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.239.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.240.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.240.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.240.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.240.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.240.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.240.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.241.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.241.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.241.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.241.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.241.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.241.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.242.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.242.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.242.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.242.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.242.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.242.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.243.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.243.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.243.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.243.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.243.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.243.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.244.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.244.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.244.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.244.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.244.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.244.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.245.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.245.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.245.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.245.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.245.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.245.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.246.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.246.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.246.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.246.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.246.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.246.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.247.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.247.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.247.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.247.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.247.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.247.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.248.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.248.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.248.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.248.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.248.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.248.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.249.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.249.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.249.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.249.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.249.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.249.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.250.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.250.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.250.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.250.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.250.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.250.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.251.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.251.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.251.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.251.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.251.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.251.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.252.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.252.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.252.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.252.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.252.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.252.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.253.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.253.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.253.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.253.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.253.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.253.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.254.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.254.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.254.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.254.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.254.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.254.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.255.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.255.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.255.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.255.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.255.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.255.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.input_layernorm.weight": "model-00158-of-000163.safetensors", "model.layers.59.post_attention_layernorm.weight": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.q_a_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.self_attn.q_a_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.q_a_layernorm.weight": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.q_b_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.self_attn.q_b_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.kv_a_proj_with_mqa.weight": "model-00158-of-000163.safetensors", - "model.layers.60.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.kv_a_layernorm.weight": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.kv_b_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.self_attn.kv_b_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.o_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.self_attn.o_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.gate.weight": "model-00158-of-000163.safetensors", "model.layers.60.mlp.gate.e_score_correction_bias": "model-00158-of-000163.safetensors", "model.layers.60.mlp.shared_experts.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.shared_experts.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.shared_experts.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.shared_experts.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.shared_experts.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.0.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.0.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.0.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.0.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.0.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.0.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.1.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.1.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.1.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.1.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.1.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.1.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.2.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.2.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.2.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.2.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.2.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.2.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.3.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.3.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.3.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.3.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.3.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.3.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.4.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.4.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.4.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.4.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.4.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.4.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.5.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.5.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.5.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.5.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.5.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.5.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.6.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.6.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.6.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.6.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.6.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.6.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.7.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.7.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.7.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.7.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.7.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.7.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.8.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.8.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.8.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.8.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.8.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.8.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.9.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.9.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.9.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.9.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.9.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.9.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.10.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.10.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.10.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.10.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.10.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.10.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.11.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.11.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.11.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.11.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.11.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.11.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.12.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.12.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.12.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.12.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.12.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.12.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.13.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.13.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.13.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.13.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.13.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.13.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.14.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.14.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.14.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.14.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.14.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.14.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.15.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.15.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.15.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.15.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.15.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.15.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.16.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.16.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.16.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.16.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.16.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.16.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.17.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.17.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.17.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.17.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.17.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.17.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.18.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.18.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.18.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.18.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.18.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.18.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.19.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.19.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.19.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.19.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.19.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.19.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.20.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.20.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.20.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.20.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.20.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.20.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.21.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.21.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.21.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.21.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.21.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.21.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.22.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.22.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.22.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.22.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.22.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.22.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.23.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.23.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.23.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.23.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.23.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.23.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.24.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.24.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.24.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.24.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.24.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.24.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.25.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.25.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.25.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.25.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.25.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.25.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.26.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.26.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.26.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.26.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.26.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.26.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.27.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.27.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.27.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.27.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.27.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.27.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.28.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.28.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.28.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.28.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.28.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.28.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.29.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.29.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.29.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.29.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.29.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.29.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.30.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.30.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.30.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.30.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.30.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.30.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.31.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.31.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.31.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.31.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.31.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.31.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.32.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.32.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.32.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.32.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.32.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.32.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.33.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.33.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.33.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.33.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.33.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.33.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.34.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.34.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.34.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.34.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.34.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.34.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.35.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.35.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.35.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.35.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.35.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.35.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.36.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.36.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.36.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.36.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.36.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.36.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.37.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.37.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.37.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.37.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.37.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.37.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.38.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.38.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.38.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.38.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.38.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.38.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.39.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.39.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.39.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.39.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.39.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.39.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.40.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.40.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.40.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.40.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.40.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.40.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.41.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.41.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.41.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.41.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.41.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.41.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.42.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.42.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.42.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.42.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.42.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.42.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.43.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.43.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.43.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.43.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.43.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.43.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.44.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.44.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.44.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.44.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.44.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.44.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.45.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.45.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.45.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.45.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.45.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.45.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.46.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.46.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.46.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.46.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.46.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.46.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.47.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.47.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.47.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.47.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.47.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.47.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.48.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.48.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.48.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.48.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.48.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.48.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.49.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.49.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.49.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.49.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.49.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.49.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.50.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.50.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.50.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.50.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.50.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.50.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.51.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.51.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.51.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.51.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.51.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.51.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.52.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.52.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.52.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.52.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.52.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.52.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.53.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.53.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.53.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.53.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.53.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.53.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.54.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.54.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.54.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.54.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.54.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.54.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.55.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.55.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.55.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.55.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.55.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.55.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.56.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.56.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.56.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.56.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.56.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.56.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.57.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.57.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.57.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.57.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.57.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.57.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.58.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.58.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.58.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.58.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.58.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.58.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.59.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.59.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.59.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.59.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.59.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.59.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.60.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.60.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.60.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.60.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.60.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.60.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.61.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.61.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.61.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.61.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.61.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.61.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.62.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.62.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.62.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.62.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.62.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.62.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.63.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.63.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.63.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.63.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.63.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.63.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.64.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.64.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.64.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.64.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.64.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.64.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.65.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.65.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.65.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.65.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.65.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.65.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.66.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.66.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.66.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.66.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.66.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.66.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.67.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.67.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.67.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.67.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.67.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.67.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.68.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.68.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.68.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.68.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.68.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.68.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.69.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.69.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.69.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.69.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.69.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.69.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.70.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.70.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.70.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.70.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.70.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.70.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.71.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.71.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.71.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.71.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.71.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.71.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.72.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.72.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.72.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.72.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.72.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.72.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.73.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.73.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.73.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.73.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.73.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.73.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.74.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.74.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.74.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.74.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.74.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.74.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.75.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.75.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.75.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.75.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.75.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.75.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.76.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.76.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.76.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.76.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.76.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.76.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.77.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.77.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.77.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.77.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.77.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.77.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.78.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.78.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.78.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.78.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.78.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.78.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.79.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.79.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.79.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.79.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.79.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.79.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.80.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.80.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.80.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.80.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.80.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.80.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.81.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.81.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.81.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.81.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.81.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.81.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.82.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.82.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.82.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.82.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.82.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.82.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.83.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.83.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.83.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.83.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.83.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.83.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.84.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.84.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.84.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.84.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.84.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.84.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.85.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.85.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.85.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.85.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.85.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.85.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.86.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.86.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.86.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.86.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.86.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.86.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.87.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.87.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.87.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.87.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.87.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.87.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.88.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.88.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.88.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.88.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.88.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.88.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.89.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.89.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.89.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.89.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.89.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.89.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.90.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.90.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.90.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.90.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.90.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.90.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.91.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.91.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.91.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.91.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.91.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.91.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.92.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.92.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.92.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.92.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.92.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.92.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.93.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.93.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.93.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.93.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.93.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.93.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.94.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.94.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.94.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.94.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.94.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.94.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.95.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.95.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.95.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.95.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.95.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.95.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.96.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.96.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.96.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.96.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.96.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.96.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.97.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.97.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.97.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.97.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.97.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.97.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.98.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.98.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.98.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.98.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.98.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.98.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.99.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.99.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.99.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.99.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.99.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.99.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.100.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.100.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.100.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.100.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.100.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.100.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.101.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.101.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.101.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.101.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.101.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.101.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.102.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.102.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.102.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.102.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.102.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.102.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.103.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.103.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.103.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.103.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.103.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.103.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.104.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.104.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.104.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.104.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.104.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.104.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.105.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.105.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.105.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.105.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.105.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.105.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.106.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.106.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.106.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.106.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.106.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.106.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.107.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.107.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.107.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.107.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.107.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.107.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.108.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.108.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.108.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.108.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.108.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.108.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.109.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.109.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.109.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.109.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.109.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.109.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.110.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.110.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.110.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.110.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.110.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.110.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.111.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.111.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.111.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.111.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.111.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.111.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.112.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.112.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.112.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.112.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.112.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.112.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.113.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.113.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.113.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.113.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.113.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.113.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.114.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.114.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.114.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.114.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.114.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.114.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.115.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.115.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.115.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.115.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.115.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.115.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.116.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.116.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.116.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.116.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.116.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.116.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.117.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.117.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.117.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.117.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.117.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.117.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.118.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.118.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.118.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.118.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.118.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.118.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.119.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.119.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.119.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.119.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.119.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.119.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.120.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.120.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.120.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.120.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.120.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.120.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.121.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.121.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.121.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.121.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.121.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.121.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.122.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.122.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.122.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.122.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.122.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.122.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.123.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.123.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.123.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.123.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.123.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.123.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.124.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.124.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.124.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.124.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.124.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.124.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.125.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.125.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.125.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.125.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.125.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.125.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.126.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.126.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.126.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.126.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.126.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.126.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.127.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.127.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.127.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.127.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.127.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.127.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.128.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.128.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.128.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.128.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.128.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.128.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.129.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.129.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.129.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.129.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.129.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.129.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.130.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.130.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.130.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.130.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.130.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.130.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.131.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.131.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.131.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.131.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.131.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.131.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.132.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.132.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.132.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.132.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.132.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.132.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.133.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.133.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.133.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.133.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.133.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.133.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.134.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.134.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.134.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.134.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.134.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.134.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.135.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.135.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.135.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.135.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.135.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.135.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.136.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.136.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.136.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.136.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.136.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.136.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.137.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.137.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.137.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.137.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.137.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.137.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.138.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.138.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.138.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.138.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.138.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.138.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.139.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.139.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.139.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.139.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.139.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.139.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.140.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.140.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.140.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.140.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.140.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.140.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.141.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.141.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.141.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.141.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.141.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.141.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.142.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.142.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.142.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.142.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.142.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.142.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.143.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.143.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.143.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.143.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.143.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.143.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.144.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.144.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.144.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.144.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.144.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.144.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.145.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.145.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.145.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.145.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.145.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.145.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.146.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.146.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.146.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.146.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.146.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.146.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.147.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.147.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.147.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.147.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.147.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.147.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.148.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.148.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.148.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.148.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.148.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.148.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.149.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.149.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.149.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.149.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.149.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.149.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.150.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.150.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.150.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.150.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.150.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.150.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.151.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.151.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.151.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.151.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.151.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.151.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.152.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.152.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.152.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.152.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.152.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.152.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.153.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.153.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.153.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.153.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.153.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.153.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.154.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.154.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.154.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.154.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.154.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.154.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.155.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.155.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.155.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.155.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.155.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.155.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.156.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.156.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.156.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.156.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.156.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.156.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.157.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.157.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.157.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.157.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.157.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.157.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.158.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.158.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.158.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.158.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.158.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.158.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.159.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.159.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.159.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.159.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.159.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.159.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.160.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.160.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.160.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.160.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.160.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.160.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.161.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.161.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.161.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.161.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.161.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.161.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.162.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.162.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.162.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.162.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.162.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.162.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.163.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.163.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.163.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.163.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.163.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.163.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.164.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.164.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.164.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.164.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.164.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.164.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.165.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.165.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.165.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.165.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.165.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.165.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.166.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.166.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.166.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.166.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.166.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.166.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.167.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.167.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.167.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.167.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.167.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.167.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.168.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.168.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.168.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.168.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.168.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.168.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.169.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.169.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.169.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.169.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.169.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.169.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.170.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.170.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.170.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.170.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.170.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.170.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.171.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.171.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.171.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.171.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.171.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.171.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.172.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.172.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.172.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.172.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.172.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.172.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.173.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.173.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.173.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.173.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.173.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.173.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.174.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.174.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.174.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.174.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.174.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.174.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.175.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.175.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.175.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.175.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.175.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.175.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.176.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.176.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.176.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.176.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.176.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.176.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.177.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.177.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.177.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.177.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.177.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.177.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.178.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.178.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.178.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.178.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.178.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.178.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.179.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.179.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.179.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.179.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.179.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.179.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.180.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.180.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.180.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.180.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.180.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.180.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.181.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.181.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.181.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.181.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.181.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.181.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.182.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.182.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.182.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.182.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.182.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.182.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.183.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.183.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.183.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.183.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.183.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.183.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.184.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.184.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.184.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.184.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.184.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.184.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.185.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.185.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.185.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.185.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.185.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.185.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.186.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.186.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.186.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.186.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.186.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.186.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.187.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.187.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.187.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.187.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.187.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.187.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.188.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.188.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.188.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.188.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.188.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.188.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.189.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.189.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.189.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.189.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.189.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.189.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.190.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.190.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.190.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.190.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.190.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.190.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.191.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.191.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.191.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.191.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.191.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.191.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.192.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.192.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.192.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.192.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.192.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.192.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.193.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.193.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.193.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.193.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.193.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.193.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.194.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.194.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.194.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.194.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.194.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.194.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.195.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.195.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.195.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.195.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.195.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.195.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.196.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.196.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.196.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.196.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.196.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.196.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.197.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.197.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.197.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.197.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.197.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.197.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.198.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.198.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.198.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.198.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.198.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.198.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.199.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.199.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.199.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.199.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.199.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.199.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.200.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.200.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.200.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.200.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.200.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.200.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.201.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.201.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.201.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.201.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.201.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.201.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.202.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.202.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.202.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.202.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.202.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.202.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.203.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.203.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.203.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.203.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.203.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.203.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.204.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.204.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.204.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.204.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.204.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.204.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.205.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.205.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.205.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.205.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.205.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.205.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.206.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.206.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.206.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.206.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.206.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.206.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.207.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.207.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.207.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.207.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.207.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.207.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.208.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.208.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.208.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.208.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.208.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.208.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.209.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.209.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.209.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.209.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.209.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.209.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.210.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.210.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.210.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.210.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.210.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.210.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.211.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.211.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.211.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.211.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.211.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.211.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.212.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.212.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.212.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.212.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.212.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.212.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.213.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.213.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.213.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.213.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.213.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.213.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.214.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.214.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.214.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.214.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.214.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.214.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.215.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.215.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.215.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.215.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.215.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.215.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.216.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.216.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.216.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.216.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.216.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.216.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.217.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.217.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.217.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.217.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.217.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.217.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.218.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.218.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.218.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.218.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.218.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.218.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.219.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.219.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.219.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.219.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.219.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.219.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.220.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.220.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.220.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.220.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.220.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.220.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.221.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.221.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.221.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.221.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.221.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.221.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.222.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.222.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.222.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.222.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.222.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.222.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.223.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.223.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.223.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.223.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.223.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.223.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.224.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.224.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.224.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.224.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.224.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.224.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.225.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.225.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.225.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.225.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.225.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.225.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.226.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.226.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.226.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.226.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.226.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.226.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.227.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.227.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.227.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.227.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.227.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.227.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.228.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.228.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.228.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.228.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.228.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.228.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.229.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.229.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.229.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.229.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.229.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.229.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.230.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.230.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.230.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.230.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.230.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.230.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.231.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.231.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.231.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.231.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.231.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.231.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.232.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.232.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.232.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.232.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.232.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.232.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.233.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.233.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.233.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.233.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.233.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.233.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.234.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.234.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.234.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.234.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.234.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.234.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.235.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.235.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.235.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.235.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.235.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.235.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.236.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.236.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.236.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.236.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.236.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.236.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.237.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.237.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.237.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.237.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.237.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.237.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.238.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.238.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.238.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.238.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.238.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.238.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.239.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.239.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.239.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.239.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.239.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.239.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.240.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.240.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.240.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.240.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.240.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.240.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.241.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.241.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.241.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.241.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.241.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.241.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.242.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.242.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.242.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.242.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.242.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.242.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.243.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.243.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.243.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.243.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.243.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.243.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.244.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.244.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.244.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.244.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.244.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.244.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.245.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.245.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.245.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.245.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.245.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.245.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.246.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.246.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.246.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.246.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.246.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.246.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.247.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.247.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.247.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.247.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.247.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.247.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.248.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.248.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.248.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.248.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.248.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.248.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.249.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.249.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.249.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.249.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.249.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.249.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.250.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.250.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.250.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.250.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.250.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.250.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.251.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.251.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.251.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.251.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.251.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.251.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.252.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.252.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.252.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.252.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.252.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.252.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.253.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.253.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.253.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.253.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.253.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.253.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.254.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.254.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.254.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.254.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.254.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.254.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.255.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.255.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.255.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.255.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.255.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.255.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.input_layernorm.weight": "model-00160-of-000163.safetensors", "model.layers.60.post_attention_layernorm.weight": "model-00160-of-000163.safetensors", "model.norm.weight": "model-00160-of-000163.safetensors", "lm_head.weight": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.q_a_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.self_attn.q_a_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.q_a_layernorm.weight": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.q_b_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.self_attn.q_b_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.kv_a_proj_with_mqa.weight": "model-00160-of-000163.safetensors", - "model.layers.61.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.kv_a_layernorm.weight": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.kv_b_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.self_attn.kv_b_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.o_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.self_attn.o_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.mlp.gate.weight": "model-00160-of-000163.safetensors", "model.layers.61.mlp.gate.e_score_correction_bias": "model-00160-of-000163.safetensors", "model.layers.61.mlp.shared_experts.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.mlp.shared_experts.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.mlp.shared_experts.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.mlp.shared_experts.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.mlp.shared_experts.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.0.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.0.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.0.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.0.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.0.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.0.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.1.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.1.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.1.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.1.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.1.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.1.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.2.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.2.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.2.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.2.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.2.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.2.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.3.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.3.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.3.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.3.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.3.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.3.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.4.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.4.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.4.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.4.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.4.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.4.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.5.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.5.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.5.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.5.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.5.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.5.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.6.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.6.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.6.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.6.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.6.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.6.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.7.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.7.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.7.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.7.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.7.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.7.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.8.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.8.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.8.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.8.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.8.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.8.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.9.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.9.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.9.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.9.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.9.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.9.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.10.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.10.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.10.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.10.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.10.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.10.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.11.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.11.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.11.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.11.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.11.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.11.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.12.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.12.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.12.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.12.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.12.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.12.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.13.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.13.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.13.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.13.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.13.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.13.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.14.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.14.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.14.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.14.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.14.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.14.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.15.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.15.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.15.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.15.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.15.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.15.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.16.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.16.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.16.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.16.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.16.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.16.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.17.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.17.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.17.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.17.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.17.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.17.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.18.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.18.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.18.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.18.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.18.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.18.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.19.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.19.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.19.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.19.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.19.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.19.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.20.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.20.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.20.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.20.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.20.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.20.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.21.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.21.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.21.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.21.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.21.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.21.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.22.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.22.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.22.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.22.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.22.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.22.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.23.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.23.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.23.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.23.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.23.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.23.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.24.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.24.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.24.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.24.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.24.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.24.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.25.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.25.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.25.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.25.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.25.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.25.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.26.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.26.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.26.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.26.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.26.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.26.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.27.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.27.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.27.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.27.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.27.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.27.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.28.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.28.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.28.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.28.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.28.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.28.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.29.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.29.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.29.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.29.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.29.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.29.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.30.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.30.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.30.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.30.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.30.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.30.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.31.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.31.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.31.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.31.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.31.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.31.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.32.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.32.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.32.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.32.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.32.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.32.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.33.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.33.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.33.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.33.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.33.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.33.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.34.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.34.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.34.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.34.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.34.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.34.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.35.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.35.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.35.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.35.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.35.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.35.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.36.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.36.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.36.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.36.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.36.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.36.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.37.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.37.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.37.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.37.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.37.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.37.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.38.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.38.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.38.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.38.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.38.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.38.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.39.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.39.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.39.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.39.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.39.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.39.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.40.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.40.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.40.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.40.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.40.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.40.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.41.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.41.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.41.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.41.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.41.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.41.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.42.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.42.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.42.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.42.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.42.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.42.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.43.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.43.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.43.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.43.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.43.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.43.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.44.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.44.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.44.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.44.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.44.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.44.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.45.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.45.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.45.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.45.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.45.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.45.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.46.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.46.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.46.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.46.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.46.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.46.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.47.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.47.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.47.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.47.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.47.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.47.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.48.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.48.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.48.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.48.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.48.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.48.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.49.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.49.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.49.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.49.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.49.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.49.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.50.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.50.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.50.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.50.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.50.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.50.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.51.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.51.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.51.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.51.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.51.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.51.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.52.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.52.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.52.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.52.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.52.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.52.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.53.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.53.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.53.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.53.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.53.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.53.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.54.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.54.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.54.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.54.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.54.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.54.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.55.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.55.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.55.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.55.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.55.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.55.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.56.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.56.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.56.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.56.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.56.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.56.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.57.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.57.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.57.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.57.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.57.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.57.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.58.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.58.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.58.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.58.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.58.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.58.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.59.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.59.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.59.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.59.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.59.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.59.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.60.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.60.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.60.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.60.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.60.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.60.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.61.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.61.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.61.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.61.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.61.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.61.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.62.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.62.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.62.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.62.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.62.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.62.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.63.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.63.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.63.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.63.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.63.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.63.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.64.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.64.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.64.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.64.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.64.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.64.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.65.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.65.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.65.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.65.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.65.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.65.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.66.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.66.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.66.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.66.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.66.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.66.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.67.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.67.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.67.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.67.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.67.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.67.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.68.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.68.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.68.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.68.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.68.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.68.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.69.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.69.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.69.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.69.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.69.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.69.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.70.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.70.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.70.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.70.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.70.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.70.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.71.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.71.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.71.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.71.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.71.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.71.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.72.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.72.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.72.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.72.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.72.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.72.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.73.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.73.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.73.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.73.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.73.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.73.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.74.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.74.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.74.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.74.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.74.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.74.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.75.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.75.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.75.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.75.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.75.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.75.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.76.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.76.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.76.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.76.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.76.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.76.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.77.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.77.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.77.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.77.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.77.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.77.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.78.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.78.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.78.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.78.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.78.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.78.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.79.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.79.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.79.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.79.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.79.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.79.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.80.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.80.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.80.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.80.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.80.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.80.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.81.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.81.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.81.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.81.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.81.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.81.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.82.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.82.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.82.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.82.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.82.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.82.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.83.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.83.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.83.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.83.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.83.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.83.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.84.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.84.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.84.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.84.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.84.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.84.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.85.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.85.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.85.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.85.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.85.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.85.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.86.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.86.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.86.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.86.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.86.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.86.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.87.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.87.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.87.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.87.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.87.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.87.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.88.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.88.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.88.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.88.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.88.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.88.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.89.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.89.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.89.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.89.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.89.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.89.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.90.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.90.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.90.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.90.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.90.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.90.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.91.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.91.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.91.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.91.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.91.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.91.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.92.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.92.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.92.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.92.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.92.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.92.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.93.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.93.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.93.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.93.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.93.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.93.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.94.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.94.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.94.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.94.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.94.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.94.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.95.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.95.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.95.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.95.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.95.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.95.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.96.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.96.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.96.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.96.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.96.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.96.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.97.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.97.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.97.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.97.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.97.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.97.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.98.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.98.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.98.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.98.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.98.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.98.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.99.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.99.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.99.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.99.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.99.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.99.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.100.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.100.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.100.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.100.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.100.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.100.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.101.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.101.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.101.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.101.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.101.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.101.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.102.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.102.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.102.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.102.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.102.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.102.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.103.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.103.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.103.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.103.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.103.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.103.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.104.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.104.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.104.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.104.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.104.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.104.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.105.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.105.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.105.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.105.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.105.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.105.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.106.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.106.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.106.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.106.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.106.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.106.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.107.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.107.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.107.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.107.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.107.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.107.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.108.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.108.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.108.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.108.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.108.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.108.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.109.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.109.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.109.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.109.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.109.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.109.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.110.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.110.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.110.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.110.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.110.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.110.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.111.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.111.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.111.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.111.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.111.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.111.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.112.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.112.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.112.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.112.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.112.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.112.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.113.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.113.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.113.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.113.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.113.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.113.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.114.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.114.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.114.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.114.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.114.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.114.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.115.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.115.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.115.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.115.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.115.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.115.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.116.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.116.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.116.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.116.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.116.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.116.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.117.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.117.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.117.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.117.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.117.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.117.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.118.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.118.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.118.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.118.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.118.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.118.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.119.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.119.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.119.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.119.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.119.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.119.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.120.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.120.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.120.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.120.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.120.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.120.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.121.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.121.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.121.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.121.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.121.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.121.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.122.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.122.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.122.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.122.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.122.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.122.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.123.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.123.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.123.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.123.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.123.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.123.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.124.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.124.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.124.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.124.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.124.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.124.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.125.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.125.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.125.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.125.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.125.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.125.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.126.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.126.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.126.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.126.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.126.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.126.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.127.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.127.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.127.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.127.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.127.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.127.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.128.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.128.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.128.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.128.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.128.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.128.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.129.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.129.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.129.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.129.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.129.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.129.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.130.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.130.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.130.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.130.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.130.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.130.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.131.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.131.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.131.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.131.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.131.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.131.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.132.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.132.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.132.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.132.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.132.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.132.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.133.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.133.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.133.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.133.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.133.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.133.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.134.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.134.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.134.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.134.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.134.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.134.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.135.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.135.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.135.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.135.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.135.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.135.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.136.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.136.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.136.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.136.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.136.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.136.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.137.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.137.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.137.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.137.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.137.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.137.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.138.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.138.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.138.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.138.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.138.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.138.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.139.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.139.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.139.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.139.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.139.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.139.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.140.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.140.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.140.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.140.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.140.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.140.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.141.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.141.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.141.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.141.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.141.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.141.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.142.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.142.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.142.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.142.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.142.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.142.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.143.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.143.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.143.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.143.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.143.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.143.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.144.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.144.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.144.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.144.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.144.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.144.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.145.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.145.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.145.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.145.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.145.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.145.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.146.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.146.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.146.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.146.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.146.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.146.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.147.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.147.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.147.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.147.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.147.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.147.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.148.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.148.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.148.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.148.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.148.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.148.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.149.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.149.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.149.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.149.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.149.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.149.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.150.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.150.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.150.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.150.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.150.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.150.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.151.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.151.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.151.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.151.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.151.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.151.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.152.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.152.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.152.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.152.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.152.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.152.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.153.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.153.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.153.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.153.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.153.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.153.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.154.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.154.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.154.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.154.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.154.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.154.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.155.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.155.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.155.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.155.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.155.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.155.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.156.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.156.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.156.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.156.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.156.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.156.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.157.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.157.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.157.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.157.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.157.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.157.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.158.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.158.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.158.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.158.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.158.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.158.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.159.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.159.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.159.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.159.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.159.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.159.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.160.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.160.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.160.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.160.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.160.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.160.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.161.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.161.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.161.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.161.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.161.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.161.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.162.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.162.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.162.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.162.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.162.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.162.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.163.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.163.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.163.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.163.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.163.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.163.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.164.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.164.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.164.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.164.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.164.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.164.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.165.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.165.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.165.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.165.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.165.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.165.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.166.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.166.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.166.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.166.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.166.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.166.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.167.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.167.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.167.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.167.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.167.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.167.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.168.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.168.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.168.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.168.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.168.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.168.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.169.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.169.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.169.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.169.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.169.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.169.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.170.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.170.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.170.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.170.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.170.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.170.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.171.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.171.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.171.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.171.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.171.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.171.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.172.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.172.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.172.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.172.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.172.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.172.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.173.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.173.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.173.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.173.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.173.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.173.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.174.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.174.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.174.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.174.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.174.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.174.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.175.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.175.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.175.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.175.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.175.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.175.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.176.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.176.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.176.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.176.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.176.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.176.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.177.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.177.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.177.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.177.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.177.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.177.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.178.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.178.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.178.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.178.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.178.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.178.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.179.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.179.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.179.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.179.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.179.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.179.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.180.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.180.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.180.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.180.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.180.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.180.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.181.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.181.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.181.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.181.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.181.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.181.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.182.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.182.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.182.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.182.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.182.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.182.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.183.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.183.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.183.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.183.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.183.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.183.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.184.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.184.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.184.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.184.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.184.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.184.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.185.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.185.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.185.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.185.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.185.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.185.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.186.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.186.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.186.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.186.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.186.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.186.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.187.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.187.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.187.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.187.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.187.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.187.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.188.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.188.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.188.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.188.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.188.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.188.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.189.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.189.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.189.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.189.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.189.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.189.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.190.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.190.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.190.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.190.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.190.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.190.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.191.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.191.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.191.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.191.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.191.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.191.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.192.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.192.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.192.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.192.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.192.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.192.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.193.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.193.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.193.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.193.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.193.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.193.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.194.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.194.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.194.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.194.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.194.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.194.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.195.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.195.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.195.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.195.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.195.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.195.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.196.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.196.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.196.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.196.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.196.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.196.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.197.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.197.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.197.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.197.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.197.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.197.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.198.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.198.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.198.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.198.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.198.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.198.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.199.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.199.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.199.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.199.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.199.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.199.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.200.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.200.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.200.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.200.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.200.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.200.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.201.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.201.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.201.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.201.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.201.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.201.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.202.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.202.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.202.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.202.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.202.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.202.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.203.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.203.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.203.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.203.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.203.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.203.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.204.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.204.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.204.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.204.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.204.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.204.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.205.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.205.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.205.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.205.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.205.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.205.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.206.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.206.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.206.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.206.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.206.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.206.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.207.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.207.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.207.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.207.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.207.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.207.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.208.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.208.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.208.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.208.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.208.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.208.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.209.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.209.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.209.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.209.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.209.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.209.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.210.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.210.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.210.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.210.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.210.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.210.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.211.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.211.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.211.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.211.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.211.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.211.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.212.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.212.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.212.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.212.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.212.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.212.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.213.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.213.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.213.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.213.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.213.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.213.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.214.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.214.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.214.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.214.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.214.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.214.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.215.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.215.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.215.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.215.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.215.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.215.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.216.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.216.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.216.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.216.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.216.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.216.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.217.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.217.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.217.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.217.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.217.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.217.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.218.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.218.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.218.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.218.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.218.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.218.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.219.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.219.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.219.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.219.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.219.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.219.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.220.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.220.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.220.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.220.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.220.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.220.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.221.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.221.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.221.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.221.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.221.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.221.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.222.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.222.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.222.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.222.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.222.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.222.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.223.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.223.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.223.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.223.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.223.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.223.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.224.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.224.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.224.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.224.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.224.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.224.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.225.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.225.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.225.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.225.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.225.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.225.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.226.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.226.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.226.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.226.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.226.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.226.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.227.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.227.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.227.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.227.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.227.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.227.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.228.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.228.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.228.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.228.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.228.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.228.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.229.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.229.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.229.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.229.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.229.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.229.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.230.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.230.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.230.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.230.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.230.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.230.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.231.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.231.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.231.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.231.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.231.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.231.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.232.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.232.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.232.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.232.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.232.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.232.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.233.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.233.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.233.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.233.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.233.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.233.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.234.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.234.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.234.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.234.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.234.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.234.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.235.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.235.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.235.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.235.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.235.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.235.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.236.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.236.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.236.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.236.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.236.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.236.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.237.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.237.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.237.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.237.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.237.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.237.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.238.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.238.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.238.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.238.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.238.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.238.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.239.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.239.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.239.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.239.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.239.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.239.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.240.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.240.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.240.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.240.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.240.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.240.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.241.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.241.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.241.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.241.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.241.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.241.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.242.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.242.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.242.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.242.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.242.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.242.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.243.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.243.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.243.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.243.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.243.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.243.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.244.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.244.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.244.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.244.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.244.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.244.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.245.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.245.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.245.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.245.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.245.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.245.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.246.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.246.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.246.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.246.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.246.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.246.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.247.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.247.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.247.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.247.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.247.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.247.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.248.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.248.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.248.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.248.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.248.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.248.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.249.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.249.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.249.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.249.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.249.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.249.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.250.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.250.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.250.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.250.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.250.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.250.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.251.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.251.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.251.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.251.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.251.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.251.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.252.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.252.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.252.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.252.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.252.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.252.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.253.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.253.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.253.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.253.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.253.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.253.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.254.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.254.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.254.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.254.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.254.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.254.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.255.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.255.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.255.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.255.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.255.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.255.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.input_layernorm.weight": "model-00163-of-000163.safetensors", "model.layers.61.post_attention_layernorm.weight": "model-00163-of-000163.safetensors", "model.layers.61.embed_tokens.weight": "model-00163-of-000163.safetensors",